1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e56f5c9eSBarry Smith A->nonzerostate++; 472e44c0bd4SBarry Smith noinsert:; 47317ab2063SBarry Smith } 47417ab2063SBarry Smith ailen[row] = nrow; 47517ab2063SBarry Smith } 4769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47817ab2063SBarry Smith } 47917ab2063SBarry Smith 480ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 481d71ae5a4SJacob Faibussowitsch { 48219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48319b08ed1SBarry Smith PetscInt *rp, k, row; 48419b08ed1SBarry Smith PetscInt *ai = a->i; 48519b08ed1SBarry Smith 
PetscInt *aj = a->j; 486fff043a9SJunchao Zhang MatScalar *aa, *ap; 48719b08ed1SBarry Smith 48819b08ed1SBarry Smith PetscFunctionBegin; 48928b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 49008401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 491fff043a9SJunchao Zhang 4929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49319b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49419b08ed1SBarry Smith row = im[k]; 49519b08ed1SBarry Smith rp = aj + ai[row]; 4968e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49719b08ed1SBarry Smith 4989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49919b08ed1SBarry Smith if (!A->structure_only) { 50019b08ed1SBarry Smith if (v) { 5019566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50219b08ed1SBarry Smith v += n; 50319b08ed1SBarry Smith } else { 5049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith a->ilen[row] = n; 50819b08ed1SBarry Smith a->imax[row] = n; 50919b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 51019b08ed1SBarry Smith a->nz += n; 51119b08ed1SBarry Smith } 5129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51419b08ed1SBarry Smith } 51519b08ed1SBarry Smith 51619b08ed1SBarry Smith /*@ 51719b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51819b08ed1SBarry Smith 51919b08ed1SBarry Smith Input Parameters: 52011a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52219b08ed1SBarry Smith 52319b08ed1SBarry Smith Level: advanced 52419b08ed1SBarry Smith 52519b08ed1SBarry Smith Notes: 52619b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52711a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52819b08ed1SBarry Smith as always with multiple matrix assemblies. 52919b08ed1SBarry Smith 5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53119b08ed1SBarry Smith @*/ 532d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 533d71ae5a4SJacob Faibussowitsch { 53419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith PetscFunctionBegin; 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5389566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53919b08ed1SBarry Smith a->maxnz = nztotal; 5404dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54119b08ed1SBarry Smith if (!a->ilen) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54319b08ed1SBarry Smith } else { 5449566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54519b08ed1SBarry Smith } 54619b08ed1SBarry Smith 54719b08ed1SBarry Smith /* allocate the matrix space */ 54819b08ed1SBarry Smith if (A->structure_only) { 5499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 55119b08ed1SBarry Smith } 
else { 5529566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55319b08ed1SBarry Smith } 55419b08ed1SBarry Smith a->i[0] = 0; 55519b08ed1SBarry Smith if (A->structure_only) { 55619b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55719b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55819b08ed1SBarry Smith } else { 55919b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 56019b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56319b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56419b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56619b08ed1SBarry Smith } 56719b08ed1SBarry Smith 568ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 569d71ae5a4SJacob Faibussowitsch { 570071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 571071fcb05SBarry Smith PetscInt *rp, k, row; 572071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 573071fcb05SBarry Smith PetscInt *aj = a->j; 574fff043a9SJunchao Zhang MatScalar *aa, *ap; 575071fcb05SBarry Smith 576071fcb05SBarry Smith PetscFunctionBegin; 5779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 578071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 579071fcb05SBarry Smith row = im[k]; 5806bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 581071fcb05SBarry Smith rp = aj + ai[row]; 582071fcb05SBarry Smith ap = aa + ai[row]; 58348a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 584071fcb05SBarry Smith if (!A->structure_only) { 585071fcb05SBarry 
Smith if (v) { 5869566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 587071fcb05SBarry Smith v += n; 588071fcb05SBarry Smith } else { 5899566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith } 592071fcb05SBarry Smith ailen[row] = n; 593071fcb05SBarry Smith a->nz += n; 594071fcb05SBarry Smith } 5959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 597071fcb05SBarry Smith } 598071fcb05SBarry Smith 599ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 600d71ae5a4SJacob Faibussowitsch { 6017eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60297f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60397f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6044e208921SJed Brown const MatScalar *ap, *aa; 6057eb43aa7SLois Curfman McInnes 6063a40ed3dSBarry Smith PetscFunctionBegin; 6074e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6087eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6097eb43aa7SLois Curfman McInnes row = im[k]; 6109371c9d4SSatish Balay if (row < 0) { 6119371c9d4SSatish Balay v += n; 6129371c9d4SSatish Balay continue; 6139371c9d4SSatish Balay } /* negative row */ 61454c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6158e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6168e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6177eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6187eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6199371c9d4SSatish Balay if (in[l] 
< 0) { 6209371c9d4SSatish Balay v++; 6219371c9d4SSatish Balay continue; 6229371c9d4SSatish Balay } /* negative column */ 62354c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 624bfeeae90SHong Zhang col = in[l]; 6259371c9d4SSatish Balay high = nrow; 6269371c9d4SSatish Balay low = 0; /* assume unsorted */ 6277eb43aa7SLois Curfman McInnes while (high - low > 5) { 6287eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6297eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6307eb43aa7SLois Curfman McInnes else low = t; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6337eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6347eb43aa7SLois Curfman McInnes if (rp[i] == col) { 635b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6367eb43aa7SLois Curfman McInnes goto finished; 6377eb43aa7SLois Curfman McInnes } 6387eb43aa7SLois Curfman McInnes } 63997e567efSBarry Smith *v++ = 0.0; 6407eb43aa7SLois Curfman McInnes finished:; 6417eb43aa7SLois Curfman McInnes } 6427eb43aa7SLois Curfman McInnes } 6434e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6457eb43aa7SLois Curfman McInnes } 6467eb43aa7SLois Curfman McInnes 647ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 648d71ae5a4SJacob Faibussowitsch { 6493ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 650c898d852SStefano Zampini const PetscScalar *av; 6513ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6523ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65317ab2063SBarry Smith 6543a40ed3dSBarry Smith PetscFunctionBegin; 6559566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6562205254eSKarl Rupp 6573ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6583ea6fe3dSLisandro Dalcin 
N = mat->cmap->N; 6593ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6603ea6fe3dSLisandro Dalcin nz = A->nz; 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* write matrix header */ 6633ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6649371c9d4SSatish Balay header[1] = M; 6659371c9d4SSatish Balay header[2] = N; 6669371c9d4SSatish Balay header[3] = nz; 6679566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 668416022c9SBarry Smith 6693ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6713ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 703cd155464SBarry Smith 704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 705d71ae5a4SJacob Faibussowitsch { 706416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 707c898d852SStefano Zampini const PetscScalar *av; 70860e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 709e060cb09SBarry Smith const char *name; 710f3ef73ceSBarry Smith PetscViewerFormat format; 71117ab2063SBarry Smith 7123a40ed3dSBarry Smith PetscFunctionBegin; 7137dc0baabSHong Zhang if (A->structure_only) { 7149566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7167dc0baabSHong Zhang } 71743e49210SHong Zhang 7189566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7193ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7202e5835c6SStefano Zampini 721c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72471c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72597f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72660e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 727c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 728d00d2cf4SBarry Smith nofinalvalue = 1; 729d00d2cf4SBarry Smith } 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 733fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 735fbfe6fa7SJed Brown #else 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 737fbfe6fa7SJed Brown #endif 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73917ab2063SBarry Smith 74017ab2063SBarry Smith for (i = 0; i < m; i++) { 74160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 742aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74417ab2063SBarry Smith #else 7459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74617ab2063SBarry Smith #endif 74717ab2063SBarry Smith } 74817ab2063SBarry Smith } 749d00d2cf4SBarry Smith if (nofinalvalue) { 750c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 752c337ccceSJed Brown #else 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 754c337ccceSJed Brown #endif 755d00d2cf4SBarry Smith } 7569566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 759fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76144cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 764aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76536db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76936db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7716831982aSBarry Smith } 77244cd7ae7SLois Curfman McInnes #else 7739566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77444cd7ae7SLois Curfman McInnes #endif 77544cd7ae7SLois Curfman McInnes } 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77744cd7ae7SLois 
Curfman McInnes } 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 779fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78097f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7819566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 783496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 784496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 786496be53dSLois Curfman McInnes if (a->j[j] >= i) { 787aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 789496be53dSLois Curfman McInnes #else 790496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 791496be53dSLois Curfman McInnes #endif 792496be53dSLois Curfman McInnes } 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 7952e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7972e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7982205254eSKarl Rupp if (i + 4 < m) { 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8002205254eSKarl Rupp } else if (i + 3 < m) { 8019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8022205254eSKarl Rupp } else if (i + 2 < m) { 8039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8042205254eSKarl Rupp } else if (i + 1 < m) { 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8062205254eSKarl Rupp } else if (i < m) { 8079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8082205254eSKarl Rupp } else { 8099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8102205254eSKarl Rupp } 811496be53dSLois Curfman McInnes } 8129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8139566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8169566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 817496be53dSLois Curfman McInnes } 8189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 819496be53dSLois Curfman McInnes } 8209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 821496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 823496be53dSLois Curfman McInnes if (a->j[j] >= i) { 824aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82548a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 826496be53dSLois Curfman McInnes #else 8279566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
828496be53dSLois Curfman McInnes #endif 829496be53dSLois Curfman McInnes } 830496be53dSLois Curfman McInnes } 8319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 832496be53dSLois Curfman McInnes } 8339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 834fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83597f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83687828ca2SBarry Smith PetscScalar value; 83768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83968f1ed48SBarry Smith 84068f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84268f1ed48SBarry Smith realonly = PETSC_FALSE; 84368f1ed48SBarry Smith break; 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith #endif 84702594712SBarry Smith 8489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84902594712SBarry Smith for (i = 0; i < m; i++) { 85002594712SBarry Smith jcnt = 0; 851d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 852e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85302594712SBarry Smith value = a->a[cnt++]; 854e24b481bSBarry Smith jcnt++; 85502594712SBarry Smith } else { 85602594712SBarry Smith value = 0.0; 85702594712SBarry Smith } 858aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85968f1ed48SBarry Smith if (realonly) { 8609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86168f1ed48SBarry Smith } else { 8629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86368f1ed48SBarry Smith } 86402594712SBarry Smith #else 8659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86602594712SBarry Smith 
#endif 86702594712SBarry Smith } 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86902594712SBarry Smith } 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8713c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 872150b93efSMatthew G. Knepley PetscInt fshift = 1; 8739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8743c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8763c215bfdSMatthew Knepley #else 8779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8783c215bfdSMatthew Knepley #endif 8799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8803c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8823c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8839566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8843c215bfdSMatthew Knepley #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8863c215bfdSMatthew Knepley #endif 8873c215bfdSMatthew Knepley } 8883c215bfdSMatthew Knepley } 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8903a40ed3dSBarry Smith } else { 8919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 892d5f3da31SBarry Smith if (A->factortype) { 89316cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89516cd7e1dSShri Abhyankar /* L part */ 89660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90216cd7e1dSShri Abhyankar } else { 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90416cd7e1dSShri Abhyankar } 90516cd7e1dSShri Abhyankar #else 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90716cd7e1dSShri Abhyankar #endif 90816cd7e1dSShri Abhyankar } 90916cd7e1dSShri Abhyankar /* diagonal */ 91016cd7e1dSShri Abhyankar j = a->diag[i]; 91116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91616cd7e1dSShri Abhyankar } else { 9179566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91816cd7e1dSShri Abhyankar } 91916cd7e1dSShri Abhyankar #else 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92116cd7e1dSShri Abhyankar #endif 92216cd7e1dSShri Abhyankar 92316cd7e1dSShri Abhyankar /* U part */ 92460e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93016cd7e1dSShri Abhyankar } else { 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93216cd7e1dSShri Abhyankar } 93316cd7e1dSShri Abhyankar #else 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93516cd7e1dSShri Abhyankar #endif 93616cd7e1dSShri Abhyankar } 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar } else { 94017ab2063SBarry Smith for (i = 0; i < m; i++) { 9419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 943aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94436db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9483a40ed3dSBarry Smith } else { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95017ab2063SBarry Smith } 95117ab2063SBarry Smith #else 9529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95317ab2063SBarry Smith #endif 95417ab2063SBarry Smith } 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95617ab2063SBarry Smith } 95716cd7e1dSShri Abhyankar } 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95917ab2063SBarry Smith } 9609566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 962416022c9SBarry Smith } 963416022c9SBarry Smith 9649804daf3SBarry Smith #include <petscdraw.h> 965ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 966d71ae5a4SJacob Faibussowitsch { 967480ef9eaSBarry Smith Mat A = (Mat)Aa; 968416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 969383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 970383922c3SLisandro Dalcin int color; 971b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 972b0a32e0cSBarry Smith PetscViewer viewer; 973f3ef73ceSBarry Smith PetscViewerFormat format; 974fff043a9SJunchao Zhang const PetscScalar *aa; 975cddf8d76SBarry Smith 
9763a40ed3dSBarry Smith PetscFunctionBegin; 9779566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9799566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 980383922c3SLisandro Dalcin 981416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 983fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 984d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9850513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 986b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 987416022c9SBarry Smith for (i = 0; i < m; i++) { 9889371c9d4SSatish Balay y_l = m - i - 1.0; 9899371c9d4SSatish Balay y_r = y_l + 1.0; 990bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9919371c9d4SSatish Balay x_l = a->j[j]; 9929371c9d4SSatish Balay x_r = x_l + 1.0; 993fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9949566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 995cddf8d76SBarry Smith } 996cddf8d76SBarry Smith } 997b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 998cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9999371c9d4SSatish Balay y_l = m - i - 1.0; 10009371c9d4SSatish Balay y_r = y_l + 1.0; 1001bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10029371c9d4SSatish Balay x_l = a->j[j]; 10039371c9d4SSatish Balay x_r = x_l + 1.0; 1004fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10059566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1006cddf8d76SBarry Smith } 1007cddf8d76SBarry Smith } 1008b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1009cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10109371c9d4SSatish Balay y_l = m - i - 1.0; 10119371c9d4SSatish Balay y_r = y_l + 1.0; 1012bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10139371c9d4SSatish Balay x_l = a->j[j]; 10149371c9d4SSatish Balay x_r = x_l + 1.0; 1015fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10169566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1017416022c9SBarry Smith } 1018416022c9SBarry Smith } 1019d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10200513a670SBarry Smith } else { 10210513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10220513a670SBarry Smith /* first determine max of all nonzero values */ 1023b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1024383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1025b0a32e0cSBarry Smith PetscDraw popup; 10260513a670SBarry Smith 10270513a670SBarry Smith for (i = 0; i < nz; i++) { 1028fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10290513a670SBarry Smith } 1030383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10319566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1033383922c3SLisandro Dalcin 1034d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10350513a670SBarry Smith for (i = 0; i < m; i++) { 1036383922c3SLisandro Dalcin y_l = m - i - 1.0; 1037383922c3SLisandro Dalcin y_r = y_l + 1.0; 1038bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1039383922c3SLisandro Dalcin x_l = a->j[j]; 1040383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1041fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10429566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10430513a670SBarry Smith count++; 10440513a670SBarry Smith } 10450513a670SBarry Smith } 1046d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10470513a670SBarry Smith } 10489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1050480ef9eaSBarry Smith } 1051cddf8d76SBarry Smith 10529804daf3SBarry Smith #include <petscdraw.h> 1053ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1054d71ae5a4SJacob Faibussowitsch { 1055b0a32e0cSBarry Smith PetscDraw draw; 105636db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1057ace3abfcSBarry Smith PetscBool isnull; 1058480ef9eaSBarry Smith 1059480ef9eaSBarry Smith PetscFunctionBegin; 10609566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10619566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10623ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1063480ef9eaSBarry Smith 10649371c9d4SSatish Balay xr = A->cmap->n; 10659371c9d4SSatish Balay yr = A->rmap->n; 10669371c9d4SSatish Balay h = yr / 10.0; 10679371c9d4SSatish Balay w = xr / 10.0; 10689371c9d4SSatish Balay xr += w; 10699371c9d4SSatish Balay yr += h; 10709371c9d4SSatish Balay xl = -w; 10719371c9d4SSatish Balay yl = -h; 10729566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10739566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10749566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10759566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10769566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1078416022c9SBarry Smith } 1079416022c9SBarry Smith 1080d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1081d71ae5a4SJacob Faibussowitsch { 1082ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1083416022c9SBarry Smith 10843a40ed3dSBarry Smith PetscFunctionBegin; 10859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10881baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10891baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10901baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10919566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109317ab2063SBarry Smith } 109419bcc07fSBarry Smith 1095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1096d71ae5a4SJacob Faibussowitsch { 1097416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1098580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1099bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 110054f21887SBarry Smith MatScalar *aa = a->a, *ap; 11013447b6efSHong Zhang PetscReal ratio = 0.6; 110217ab2063SBarry Smith 11033a40ed3dSBarry Smith PetscFunctionBegin; 11043ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1106b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1107b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11089566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1110b215bc84SStefano Zampini } 111117ab2063SBarry Smith 111243ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111317ab2063SBarry Smith for (i = 1; i < m; i++) { 1114416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111517ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111694a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111717ab2063SBarry Smith if (fshift) { 1118bfeeae90SHong Zhang ip = aj + ai[i]; 1119bfeeae90SHong Zhang ap = aa + ai[i]; 112017ab2063SBarry Smith N = ailen[i]; 11219566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112248a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112317ab2063SBarry Smith } 112417ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112517ab2063SBarry Smith } 112617ab2063SBarry Smith if (m) { 112717ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112817ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112917ab2063SBarry Smith } 113017ab2063SBarry Smith /* reset ilen and imax for each row */ 11317b083b7cSBarry Smith a->nonzerorowcnt = 0; 1132396832f4SHong Zhang if (A->structure_only) { 11339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1135396832f4SHong Zhang } else { /* !A->structure_only */ 113617ab2063SBarry Smith for (i = 0; i < m; i++) { 113717ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11387b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113917ab2063SBarry Smith } 1140396832f4SHong Zhang } 
1141bfeeae90SHong Zhang a->nz = ai[m]; 1142aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1143bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1144bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1145bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1146bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1147bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1148bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1149bc43efbbSJunchao Zhang break; 1150bc43efbbSJunchao Zhang } 1151bc43efbbSJunchao Zhang } 11529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11552205254eSKarl Rupp 11568e58a170SBarry Smith A->info.mallocs += a->reallocs; 1157dd5f02e7SSatish Balay a->reallocs = 0; 11586712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115936db0b34SBarry Smith a->rmax = rmax; 11604e220ebcSLois Curfman McInnes 116148a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11629566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116417ab2063SBarry Smith } 116517ab2063SBarry Smith 1166ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1167d71ae5a4SJacob Faibussowitsch 
{ 116899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116999cafbc1SBarry Smith PetscInt i, nz = a->nz; 11702e5835c6SStefano Zampini MatScalar *aa; 117199cafbc1SBarry Smith 117299cafbc1SBarry Smith PetscFunctionBegin; 11739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117899cafbc1SBarry Smith } 117999cafbc1SBarry Smith 1180ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1181d71ae5a4SJacob Faibussowitsch { 118299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118399cafbc1SBarry Smith PetscInt i, nz = a->nz; 11842e5835c6SStefano Zampini MatScalar *aa; 118599cafbc1SBarry Smith 118699cafbc1SBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118899cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119299cafbc1SBarry Smith } 119399cafbc1SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197fff043a9SJunchao Zhang MatScalar *aa; 11983a40ed3dSBarry Smith 11993a40ed3dSBarry Smith PetscFunctionBegin; 12009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12039566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120517ab2063SBarry Smith } 1206416022c9SBarry Smith 1207d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1208d71ae5a4SJacob Faibussowitsch { 1209416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1210d5d45c9bSBarry Smith 12113a40ed3dSBarry Smith PetscFunctionBegin; 1212b4e2f619SBarry Smith if (A->hash_active) { 1213e3c72094SPierre Jolivet A->ops[0] = a->cops; 1214b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1215b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1216b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1217b4e2f619SBarry Smith } 1218b4e2f619SBarry Smith 12193ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12209566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12299566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12339566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12349566063dSJacob Faibussowitsch 
PetscCall(PetscFree(A->data)); 1235901853e0SKris Buschelman 12366718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12376718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12386718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12396718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12406718818eSStefano Zampini due to different matrix sizes */ 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12426718818eSStefano Zampini 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12522e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12532e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12542e956fe4SStefano Zampini 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12552e956fe4SStefano Zampini #endif 12564222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12604222ddf1SHong Zhang #endif 1261d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1262d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1263d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1264d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1265d5e393b6SSuyash Tandon #endif 12663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12683d0639e7SStefano Zampini #endif 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1270af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1272af8000cdSHong Zhang #endif 1273d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1275d24d4204SJose E. 
Roman #endif 127663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127963c07aadSStefano Zampini #endif 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12962e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12972e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12992e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 130317ab2063SBarry Smith } 130417ab2063SBarry Smith 1305d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1306d71ae5a4SJacob Faibussowitsch { 1307416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13083a40ed3dSBarry Smith 13093a40ed3dSBarry Smith PetscFunctionBegin; 1310a65d3064SKris Buschelman switch (op) { 1311d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1312d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1315d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1318d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1319d71ae5a4SJacob Faibussowitsch break; 1320d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1321d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1322d71ae5a4SJacob Faibussowitsch break; 1323d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1324d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1325d71ae5a4SJacob Faibussowitsch break; 1326d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1327d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1328d71ae5a4SJacob Faibussowitsch break; 1329d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1330d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1331d71ae5a4SJacob Faibussowitsch break; 13323d472b54SHong Zhang case MAT_SPD: 1333b1646e73SJed Brown case MAT_SYMMETRIC: 1334b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1335b1646e73SJed Brown case MAT_HERMITIAN: 1336b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1337957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1338b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1339b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1340b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13415021d80fSJed Brown break; 13428c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1343a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1344d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1345d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1348d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1349d71ae5a4SJacob Faibussowitsch break; 1350d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1351d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1352d71ae5a4SJacob Faibussowitsch break; 
1353071fcb05SBarry Smith case MAT_SORTED_FULL: 1354071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1355071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1356071fcb05SBarry Smith break; 1357d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1358d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1359d71ae5a4SJacob Faibussowitsch break; 1360d71ae5a4SJacob Faibussowitsch default: 1361d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1362a65d3064SKris Buschelman } 13633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136417ab2063SBarry Smith } 136517ab2063SBarry Smith 1366ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1367d71ae5a4SJacob Faibussowitsch { 1368416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1369fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1370c898d852SStefano Zampini PetscScalar *x; 1371c898d852SStefano Zampini const PetscScalar *aa; 137217ab2063SBarry Smith 13733a40ed3dSBarry Smith PetscFunctionBegin; 13749566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1377d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1378d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13799566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13802c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138435e7444dSHong Zhang } 138535e7444dSHong Zhang 13869566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138735e7444dSHong Zhang for (i = 0; i < n; i++) { 1388fdc842d1SBarry Smith x[i] = 0.0; 138935e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139035e7444dSHong Zhang if (aj[j] == i) { 139135e7444dSHong Zhang x[i] = aa[j]; 139217ab2063SBarry Smith break; 139317ab2063SBarry Smith } 139417ab2063SBarry Smith } 139517ab2063SBarry Smith } 13969566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139917ab2063SBarry Smith } 140017ab2063SBarry Smith 1401c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1403d71ae5a4SJacob Faibussowitsch { 1404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14055f22a7b3SSebastian Grimberg const MatScalar *aa; 1406d9ca1df4SBarry Smith PetscScalar *y; 1407d9ca1df4SBarry Smith const PetscScalar *x; 1408d0f46423SBarry Smith PetscInt m = A->rmap->n; 14095c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14105f22a7b3SSebastian Grimberg const MatScalar *v; 1411a77337e4SBarry Smith PetscScalar alpha; 1412d9ca1df4SBarry Smith PetscInt n, i, j; 1413d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14143447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1415ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14165c897100SBarry Smith #endif 141717ab2063SBarry Smith 14183a40ed3dSBarry Smith PetscFunctionBegin; 14199566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14209566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14219566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14235c897100SBarry Smith 14245c897100SBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1425fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14265c897100SBarry Smith #else 14273447b6efSHong Zhang if (usecprow) { 14283447b6efSHong Zhang m = cprow.nrows; 14293447b6efSHong Zhang ii = cprow.i; 14307b2bb3b9SHong Zhang ridx = cprow.rindex; 14313447b6efSHong Zhang } else { 14323447b6efSHong Zhang ii = a->i; 14333447b6efSHong Zhang } 143417ab2063SBarry Smith for (i = 0; i < m; i++) { 14353447b6efSHong Zhang idx = a->j + ii[i]; 1436fff043a9SJunchao Zhang v = aa + ii[i]; 14373447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14383447b6efSHong Zhang if (usecprow) { 14397b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14403447b6efSHong Zhang } else { 144117ab2063SBarry Smith alpha = x[i]; 14423447b6efSHong Zhang } 144304fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144417ab2063SBarry Smith } 14455c897100SBarry Smith #endif 14469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14489566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145117ab2063SBarry Smith } 145217ab2063SBarry Smith 1453d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1454d71ae5a4SJacob Faibussowitsch { 14555c897100SBarry Smith PetscFunctionBegin; 14569566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14579566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14595c897100SBarry Smith } 14605c897100SBarry Smith 1461c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146278b84d54SShri Abhyankar 1463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 
1464d71ae5a4SJacob Faibussowitsch { 1465416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1466d9fead3dSBarry Smith PetscScalar *y; 146754f21887SBarry Smith const PetscScalar *x; 1468fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1469003131ecSBarry Smith PetscInt m = A->rmap->n; 14700298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14717b083b7cSBarry Smith PetscInt n, i; 1472362ced78SSatish Balay PetscScalar sum; 1473ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147417ab2063SBarry Smith 1475b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147697952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1477fee21e36SBarry Smith #endif 1478fee21e36SBarry Smith 14793a40ed3dSBarry Smith PetscFunctionBegin; 1480b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14819566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1483b215bc84SStefano Zampini } 14849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14869566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1487416022c9SBarry Smith ii = a->i; 14884eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14899566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149097952fefSHong Zhang m = a->compressedrow.nrows; 149197952fefSHong Zhang ii = a->compressedrow.i; 149297952fefSHong Zhang ridx = a->compressedrow.rindex; 149397952fefSHong Zhang for (i = 0; i < m; i++) { 149497952fefSHong Zhang n = ii[i + 1] - ii[i]; 149597952fefSHong Zhang aj = a->j + ii[i]; 1496fff043a9SJunchao Zhang aa = a_a + ii[i]; 149797952fefSHong Zhang sum = 0.0; 1498003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1499003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150097952fefSHong Zhang y[*ridx++] = sum; 150197952fefSHong Zhang } 150297952fefSHong 
Zhang } else { /* do not use compressed row format */ 1503b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15043d3eaba7SBarry Smith aj = a->j; 1505fff043a9SJunchao Zhang aa = a_a; 1506b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1507b05257ddSBarry Smith #else 150817ab2063SBarry Smith for (i = 0; i < m; i++) { 1509003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1510003131ecSBarry Smith aj = a->j + ii[i]; 1511fff043a9SJunchao Zhang aa = a_a + ii[i]; 151217ab2063SBarry Smith sum = 0.0; 1513003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151417ab2063SBarry Smith y[i] = sum; 151517ab2063SBarry Smith } 15168d195f9aSBarry Smith #endif 1517b05257ddSBarry Smith } 15189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152317ab2063SBarry Smith } 152417ab2063SBarry Smith 1525ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1526ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1527d71ae5a4SJacob Faibussowitsch { 1528b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1529b434eb95SMatthew G. Knepley PetscScalar *y; 1530b434eb95SMatthew G. Knepley const PetscScalar *x; 1531fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1532b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1533b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1534b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1535b434eb95SMatthew G. Knepley PetscScalar sum; 1536b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1537b434eb95SMatthew G. Knepley 1538b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1539b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1540b434eb95SMatthew G. Knepley #endif 1541b434eb95SMatthew G. Knepley 1542b434eb95SMatthew G. Knepley PetscFunctionBegin; 15439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15459566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1546b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1547b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1548b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1549b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1550b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1551b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1552b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1553fff043a9SJunchao Zhang aa = a_a + ii[i]; 1554b434eb95SMatthew G. Knepley sum = 0.0; 1555b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1556b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1557b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1558b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1559b434eb95SMatthew G. Knepley } 1560b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15613d3eaba7SBarry Smith ii = a->i; 1562b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1563b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1564b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1565fff043a9SJunchao Zhang aa = a_a + ii[i]; 1566b434eb95SMatthew G. Knepley sum = 0.0; 1567b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1568b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1569b434eb95SMatthew G. Knepley y[i] = sum; 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. 
Knepley } 15729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15749566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1577b434eb95SMatthew G. Knepley } 1578b434eb95SMatthew G. Knepley 1579ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1580ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1581d71ae5a4SJacob Faibussowitsch { 1582b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1583b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1584b434eb95SMatthew G. Knepley const PetscScalar *x; 1585fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1586b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1587b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1588b434eb95SMatthew G. Knepley PetscScalar sum; 1589b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1590b434eb95SMatthew G. Knepley 1591b434eb95SMatthew G. Knepley PetscFunctionBegin; 15929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15939566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15949566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1595b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159648a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1597b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1598b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1599b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1600b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1601b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1602b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1603fff043a9SJunchao Zhang aa = a_a + ii[i]; 1604b434eb95SMatthew G. Knepley sum = y[*ridx]; 1605b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1606b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1607b434eb95SMatthew G. Knepley } 1608b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16093d3eaba7SBarry Smith ii = a->i; 1610b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1611b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1612b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1613fff043a9SJunchao Zhang aa = a_a + ii[i]; 1614b434eb95SMatthew G. Knepley sum = y[i]; 1615b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1616b434eb95SMatthew G. Knepley z[i] = sum; 1617b434eb95SMatthew G. Knepley } 1618b434eb95SMatthew G. Knepley } 16199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1624b434eb95SMatthew G. Knepley } 1625b434eb95SMatthew G. 
Knepley 1626c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1627d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1628d71ae5a4SJacob Faibussowitsch { 1629416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1630f15663dcSBarry Smith PetscScalar *y, *z; 1631f15663dcSBarry Smith const PetscScalar *x; 1632fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1633d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1634d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1635362ced78SSatish Balay PetscScalar sum; 1636ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16379ea0dfa2SSatish Balay 16383a40ed3dSBarry Smith PetscFunctionBegin; 1639b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16409566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1642b215bc84SStefano Zampini } 16439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16459566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16464eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164897952fefSHong Zhang m = a->compressedrow.nrows; 164997952fefSHong Zhang ii = a->compressedrow.i; 165097952fefSHong Zhang ridx = a->compressedrow.rindex; 165197952fefSHong Zhang for (i = 0; i < m; i++) { 165297952fefSHong Zhang n = ii[i + 1] - ii[i]; 165397952fefSHong Zhang aj = a->j + ii[i]; 1654fff043a9SJunchao Zhang aa = a_a + ii[i]; 165597952fefSHong Zhang sum = y[*ridx]; 1656f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165797952fefSHong Zhang z[*ridx++] = sum; 165897952fefSHong Zhang } 165997952fefSHong Zhang } else { /* do not use compressed row format */ 16603d3eaba7SBarry Smith ii = a->i; 
1661f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16623d3eaba7SBarry Smith aj = a->j; 1663fff043a9SJunchao Zhang aa = a_a; 1664f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1665f15663dcSBarry Smith #else 166617ab2063SBarry Smith for (i = 0; i < m; i++) { 1667f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1668f15663dcSBarry Smith aj = a->j + ii[i]; 1669fff043a9SJunchao Zhang aa = a_a + ii[i]; 167017ab2063SBarry Smith sum = y[i]; 1671f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167217ab2063SBarry Smith z[i] = sum; 167317ab2063SBarry Smith } 167402ab625aSSatish Balay #endif 1675f15663dcSBarry Smith } 16769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168117ab2063SBarry Smith } 168217ab2063SBarry Smith 168317ab2063SBarry Smith /* 168417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
168517ab2063SBarry Smith */ 1686d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1687d71ae5a4SJacob Faibussowitsch { 1688416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1689d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1690c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169117ab2063SBarry Smith 16923a40ed3dSBarry Smith PetscFunctionBegin; 169309f38230SBarry Smith if (!a->diag) { 16949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1695c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169609f38230SBarry Smith } 1697d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1698c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1699c0c07093SJunchao Zhang if (alreadySet) { 1700c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1701c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1702c0c07093SJunchao Zhang } 1703c0c07093SJunchao Zhang 170409f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1705bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1706bfeeae90SHong Zhang if (a->j[j] == i) { 170709f38230SBarry Smith a->diag[i] = j; 170817ab2063SBarry Smith break; 170917ab2063SBarry Smith } 171017ab2063SBarry Smith } 171117ab2063SBarry Smith } 17123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171317ab2063SBarry Smith } 171417ab2063SBarry Smith 1715ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1716d71ae5a4SJacob Faibussowitsch { 171761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 172061ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 172161ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172261ecd0c6SBarry Smith 172361ecd0c6SBarry 
Smith PetscFunctionBegin; 172461ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17269566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172861ecd0c6SBarry Smith } 172961ecd0c6SBarry Smith 173061ecd0c6SBarry Smith if (a->diagonaldense) { 173161ecd0c6SBarry Smith cnt = 0; 173261ecd0c6SBarry Smith } else { 17339566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173461ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1735349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173661ecd0c6SBarry Smith cnt++; 173761ecd0c6SBarry Smith mdiag[i] = 1; 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith } 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith if (!cnt) { 17429566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174361ecd0c6SBarry Smith } else { 1744b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1745b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 174661ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 17476ea2a7edSJunchao Zhang const PetscScalar *Aa; 17486ea2a7edSJunchao Zhang 17496ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17506ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 175161ecd0c6SBarry Smith 175261ecd0c6SBarry Smith a->a = NULL; 175361ecd0c6SBarry Smith a->j = NULL; 175461ecd0c6SBarry Smith a->i = NULL; 175561ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1756ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17579566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175861ecd0c6SBarry Smith 175961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17619566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176248a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1763447d62f5SStefano Zampini } 17649566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17659566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 176661ecd0c6SBarry Smith if (singlemalloc) { 17679566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 176861ecd0c6SBarry Smith } else { 17699566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17709566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17719566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 177261ecd0c6SBarry Smith } 177361ecd0c6SBarry Smith } 17749566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177561ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177761ecd0c6SBarry Smith } 177861ecd0c6SBarry Smith 1779be5855fcSBarry Smith /* 1780be5855fcSBarry Smith Checks for missing diagonals 1781be5855fcSBarry Smith */ 1782d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1783d71ae5a4SJacob Faibussowitsch { 1784be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17857734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1786be5855fcSBarry Smith 1787be5855fcSBarry Smith PetscFunctionBegin; 178809f38230SBarry Smith *missing = PETSC_FALSE; 17897734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 179009f38230SBarry Smith *missing = PETSC_TRUE; 179109f38230SBarry Smith if (d) *d = 0; 17929566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 179309f38230SBarry Smith } else { 179401445905SHong Zhang PetscInt n; 179501445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1796f1e2ffcdSBarry Smith diag = a->diag; 179701445905SHong Zhang for (i = 0; i < n; i++) { 17987734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179909f38230SBarry Smith *missing = PETSC_TRUE; 180009f38230SBarry Smith if (d) *d = i; 18019566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1802358d2f5dSShri Abhyankar break; 180309f38230SBarry Smith } 1804be5855fcSBarry Smith } 1805be5855fcSBarry Smith } 18063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1807be5855fcSBarry Smith } 1808be5855fcSBarry Smith 18090da83c2eSBarry Smith #include <petscblaslapack.h> 18100da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18110da83c2eSBarry Smith 18120da83c2eSBarry Smith /* 18130da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18140da83c2eSBarry Smith */ 1815ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1816d71ae5a4SJacob Faibussowitsch { 18170da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18180da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18190da83c2eSBarry Smith const PetscReal shift = 0.0; 18200da83c2eSBarry Smith PetscInt ipvt[5]; 18214e208921SJed Brown PetscCount flops = 0; 18220da83c2eSBarry Smith PetscScalar work[25], *v_work; 18230da83c2eSBarry Smith 18240da83c2eSBarry Smith PetscFunctionBegin; 18250da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18260da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182708401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1828ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 183048a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18310da83c2eSBarry Smith ncnt = 0; 18320da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18330da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18350da83c2eSBarry Smith switch (bsizes[i]) { 1836d71ae5a4SJacob Faibussowitsch case 1: 1837d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1838d71ae5a4SJacob Faibussowitsch break; 18390da83c2eSBarry Smith case 2: 18409566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18410da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18430da83c2eSBarry Smith break; 18440da83c2eSBarry Smith case 3: 18459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18480da83c2eSBarry Smith break; 18490da83c2eSBarry Smith case 4: 18509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18510da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18530da83c2eSBarry Smith break; 18540da83c2eSBarry Smith case 5: 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18580da83c2eSBarry Smith break; 18590da83c2eSBarry Smith case 6: 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18630da83c2eSBarry Smith break; 18640da83c2eSBarry Smith case 7: 18659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18680da83c2eSBarry Smith break; 18690da83c2eSBarry Smith default: 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18730da83c2eSBarry Smith } 18740da83c2eSBarry Smith ncnt += bsizes[i]; 18750da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18764e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18770da83c2eSBarry Smith } 18783ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187948a46eb9SPierre Jolivet if 
(bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18809566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18820da83c2eSBarry Smith } 18830da83c2eSBarry Smith 1884422a814eSBarry Smith /* 1885422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1886422a814eSBarry Smith */ 1887ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1888d71ae5a4SJacob Faibussowitsch { 188971f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1890d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18912e5835c6SStefano Zampini const MatScalar *v; 189254f21887SBarry Smith PetscScalar *idiag, *mdiag; 189371f1c65dSBarry Smith 189471f1c65dSBarry Smith PetscFunctionBegin; 18953ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18969566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189771f1c65dSBarry Smith diag = a->diag; 18984dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18992e5835c6SStefano Zampini 190071f1c65dSBarry Smith mdiag = a->mdiag; 190171f1c65dSBarry Smith idiag = a->idiag; 19029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1903422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190471f1c65dSBarry Smith for (i = 0; i < m; i++) { 190571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1906899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1907899639b0SHong Zhang if (PetscRealPart(fshift)) { 19089566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19097b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19107b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19117b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 191298921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1913899639b0SHong Zhang } 191471f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 191571f1c65dSBarry Smith } 19169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191771f1c65dSBarry Smith } else { 191871f1c65dSBarry Smith for (i = 0; i < m; i++) { 191971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 192071f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 192171f1c65dSBarry Smith } 19229566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 192371f1c65dSBarry Smith } 192471f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192771f1c65dSBarry Smith } 192871f1c65dSBarry Smith 1929d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1930d71ae5a4SJacob Faibussowitsch { 1931416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1932e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19332e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193454f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19353d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193697f1f81fSBarry Smith const PetscInt *idx, *diag; 193717ab2063SBarry Smith 19383a40ed3dSBarry Smith PetscFunctionBegin; 1939b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19409566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1942b215bc84SStefano Zampini } 1943b965ef7fSBarry Smith its = its * lits; 194491723122SBarry Smith 194571f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19469566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194771f1c65dSBarry Smith a->fshift = fshift; 194871f1c65dSBarry Smith a->omega = omega; 1949ed480e8bSBarry Smith 195071f1c65dSBarry Smith diag = a->diag; 195171f1c65dSBarry Smith t = a->ssor_work; 1952ed480e8bSBarry Smith idiag = a->idiag; 195371f1c65dSBarry Smith mdiag = a->mdiag; 1954ed480e8bSBarry Smith 19559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19569566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19579566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1958ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 196017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1961ed480e8bSBarry Smith bs = b; 196217ab2063SBarry Smith for (i = 0; i < m; i++) { 196371f1c65dSBarry Smith d = fshift + mdiag[i]; 1964416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1965ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19662e5835c6SStefano Zampini v = aa + diag[i] + 1; 196717ab2063SBarry Smith sum = b[i] * d / omega; 1968003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196917ab2063SBarry Smith x[i] = sum; 197017ab2063SBarry Smith } 19719566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19729566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197617ab2063SBarry Smith } 1977c783ea89SBarry Smith 197808401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1979f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19804c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1981887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 198217ab2063SBarry Smith 198317ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198417ab2063SBarry Smith 1985887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198617ab2063SBarry Smith */ 198717ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198817ab2063SBarry Smith 198917ab2063SBarry Smith /* x = (E + U)^{-1} b */ 199017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1991416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1992ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19932e5835c6SStefano Zampini v = aa + diag[i] + 1; 199417ab2063SBarry Smith sum = b[i]; 1995e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1996ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199717ab2063SBarry Smith } 199817ab2063SBarry Smith 199917ab2063SBarry Smith /* t = b - (2*E - D)x */ 20002e5835c6SStefano Zampini v = aa; 20012205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 200217ab2063SBarry Smith 200317ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2004ed480e8bSBarry Smith ts = t; 2005416022c9SBarry Smith diag = a->diag; 200617ab2063SBarry Smith for (i = 0; i < m; i++) { 2007416022c9SBarry Smith n = diag[i] - a->i[i]; 2008ed480e8bSBarry Smith idx = a->j + a->i[i]; 20092e5835c6SStefano Zampini v = aa + a->i[i]; 201017ab2063SBarry Smith sum = t[i]; 2011003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2012ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2013733d66baSBarry Smith /* x = x + t */ 2014733d66baSBarry Smith x[i] += t[i]; 201517ab2063SBarry Smith } 201617ab2063SBarry Smith 20179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20189566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202117ab2063SBarry Smith } 202217ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 202317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202417ab2063SBarry Smith for (i = 0; i < m; i++) { 2025416022c9SBarry Smith n = diag[i] - a->i[i]; 2026ed480e8bSBarry Smith idx = a->j + a->i[i]; 20272e5835c6SStefano Zampini v = aa + a->i[i]; 202817ab2063SBarry Smith sum = b[i]; 2029e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20305c99c7daSBarry Smith t[i] = sum; 2031ed480e8bSBarry Smith x[i] = sum * idiag[i]; 203217ab2063SBarry Smith } 20335c99c7daSBarry Smith xb = t; 20349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20353a40ed3dSBarry Smith } else xb = b; 203617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2038416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2039ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20402e5835c6SStefano Zampini v = aa + diag[i] + 1; 204117ab2063SBarry Smith sum = xb[i]; 2042e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20435c99c7daSBarry Smith if (xb == b) { 2044ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20455c99c7daSBarry Smith } else { 2046b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204717ab2063SBarry Smith } 20485c99c7daSBarry Smith } 20499566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 205017ab2063SBarry Smith } 205117ab2063SBarry Smith its--; 205217ab2063SBarry Smith } 205317ab2063SBarry Smith while (its--) { 205417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205517ab2063SBarry Smith for (i = 0; i < m; i++) { 2056b19a5dc2SMark Adams /* lower */ 2057b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2058ed480e8bSBarry Smith idx = a->j + a->i[i]; 20592e5835c6SStefano 
Zampini v = aa + a->i[i]; 206017ab2063SBarry Smith sum = b[i]; 2061e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2062b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2063b19a5dc2SMark Adams /* upper */ 2064b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2065b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20662e5835c6SStefano Zampini v = aa + diag[i] + 1; 2067b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2068b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206917ab2063SBarry Smith } 2070b19a5dc2SMark Adams xb = t; 20719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2072b19a5dc2SMark Adams } else xb = b; 207317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2075b19a5dc2SMark Adams sum = xb[i]; 2076b19a5dc2SMark Adams if (xb == b) { 2077b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2078416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2079ed480e8bSBarry Smith idx = a->j + a->i[i]; 20802e5835c6SStefano Zampini v = aa + a->i[i]; 2081e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2082ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2083b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2084b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2085b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20862e5835c6SStefano Zampini v = aa + diag[i] + 1; 2087b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2088b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208917ab2063SBarry Smith } 2090b19a5dc2SMark Adams } 2091b19a5dc2SMark Adams if (xb == b) { 20929566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2093b19a5dc2SMark Adams } else { 20949566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2095b19a5dc2SMark Adams } 209617ab2063SBarry Smith } 209717ab2063SBarry Smith } 20989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20999566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 21009566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 21013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 210217ab2063SBarry Smith } 210317ab2063SBarry Smith 2104ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2105d71ae5a4SJacob Faibussowitsch { 2106416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21074e220ebcSLois Curfman McInnes 21083a40ed3dSBarry Smith PetscFunctionBegin; 21094e220ebcSLois Curfman McInnes info->block_size = 1.0; 21103966268fSBarry Smith info->nz_allocated = a->maxnz; 21113966268fSBarry Smith info->nz_used = a->nz; 21123966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21133966268fSBarry Smith info->assemblies = A->num_ass; 21143966268fSBarry Smith info->mallocs = A->info.mallocs; 21154dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2116d5f3da31SBarry Smith if (A->factortype) { 21174e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21184e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21194e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21204e220ebcSLois Curfman McInnes } else { 21214e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21224e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21234e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21244e220ebcSLois Curfman McInnes } 21253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212617ab2063SBarry Smith } 212717ab2063SBarry Smith 2128ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2129d71ae5a4SJacob Faibussowitsch { 2130416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2131c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 213297b48c8fSBarry Smith const PetscScalar *xx; 21332e5835c6SStefano Zampini PetscScalar *bb, *aa; 2134c7da8527SEric Chamberland PetscInt d = 0; 213517ab2063SBarry Smith 21363a40ed3dSBarry Smith PetscFunctionBegin; 213797b48c8fSBarry Smith if (x && b) { 21389566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21399566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 214097b48c8fSBarry Smith for (i = 0; i < N; i++) { 2141aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2142447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214397b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214497b48c8fSBarry Smith } 21459566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21469566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214797b48c8fSBarry Smith } 214897b48c8fSBarry Smith 21499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2150a9817697SBarry Smith if (a->keepnonzeropattern) { 2151f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2152aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21539566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2154f1e2ffcdSBarry Smith } 2155f4df32b1SMatthew Knepley if (diag != 0.0) { 2156c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2157c7da8527SEric 
Chamberland d = rows[i]; 2158447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215908401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2160c7da8527SEric Chamberland } 2161f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2162447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21632e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2164f1e2ffcdSBarry Smith } 2165f1e2ffcdSBarry Smith } 2166f1e2ffcdSBarry Smith } else { 2167f4df32b1SMatthew Knepley if (diag != 0.0) { 216817ab2063SBarry Smith for (i = 0; i < N; i++) { 2169aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21707ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2171447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2172447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2173447d62f5SStefano Zampini } else { 2174416022c9SBarry Smith a->ilen[rows[i]] = 1; 21752e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2176bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2177447d62f5SStefano Zampini } 2178447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21799566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 218017ab2063SBarry Smith } 218117ab2063SBarry Smith } 21823a40ed3dSBarry Smith } else { 218317ab2063SBarry Smith for (i = 0; i < N; i++) { 2184aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2185416022c9SBarry Smith a->ilen[rows[i]] = 0; 218617ab2063SBarry Smith } 218717ab2063SBarry Smith } 2188e56f5c9eSBarry Smith A->nonzerostate++; 2189f1e2ffcdSBarry Smith } 21909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2191dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219317ab2063SBarry Smith } 219417ab2063SBarry Smith 2195ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2196d71ae5a4SJacob Faibussowitsch { 21976e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21986e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21992b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 22006e169961SBarry Smith const PetscScalar *xx; 22012e5835c6SStefano Zampini PetscScalar *bb, *aa; 22026e169961SBarry Smith 22036e169961SBarry Smith PetscFunctionBegin; 22043ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22066e169961SBarry Smith if (x && b) { 22079566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22089566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22092b40b63fSBarry Smith vecs = PETSC_TRUE; 22106e169961SBarry Smith } 22119566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22126e169961SBarry Smith for (i = 0; i < N; i++) { 2213aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22148e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22152205254eSKarl Rupp 22166e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22176e169961SBarry Smith } 22186e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22196e169961SBarry Smith if (!zeroed[i]) { 22206e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22214cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22222e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22232e5835c6SStefano Zampini 
aa[j] = 0.0; 22246e169961SBarry Smith } 22256e169961SBarry Smith } 22264cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22276e169961SBarry Smith } 22286e169961SBarry Smith if (x && b) { 22299566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22309566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22316e169961SBarry Smith } 22329566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22336e169961SBarry Smith if (diag != 0.0) { 22349566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22351d5a398dSstefano_zampini if (missing) { 22361d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22374cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2238aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22399566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22401d5a398dSstefano_zampini } 22411d5a398dSstefano_zampini } else { 2242ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22436e169961SBarry Smith } 22441d5a398dSstefano_zampini } 22459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2246dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22486e169961SBarry Smith } 22496e169961SBarry Smith 2250d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2251d71ae5a4SJacob Faibussowitsch { 2252fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2253fff043a9SJunchao Zhang const PetscScalar *aa; 225417ab2063SBarry Smith 22553a40ed3dSBarry Smith PetscFunctionBegin; 22569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2257416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22588e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 225917ab2063SBarry Smith if (idx) { 22605c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2261f4259b30SLisandro Dalcin else *idx = NULL; 226217ab2063SBarry Smith } 22639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226517ab2063SBarry Smith } 226617ab2063SBarry Smith 2267d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2268d71ae5a4SJacob Faibussowitsch { 22693a40ed3dSBarry Smith PetscFunctionBegin; 22703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227117ab2063SBarry Smith } 227217ab2063SBarry Smith 2273ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2274d71ae5a4SJacob Faibussowitsch { 2275416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22762e5835c6SStefano Zampini const MatScalar *v; 227736db0b34SBarry Smith PetscReal sum = 0.0; 227897f1f81fSBarry Smith PetscInt i, j; 227917ab2063SBarry Smith 22803a40ed3dSBarry Smith PetscFunctionBegin; 22819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228217ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2283570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2284570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2285792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2286570b7f6dSBarry Smith #else 2287416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22889371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22899371c9d4SSatish Balay v++; 229017ab2063SBarry Smith } 22918f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2292570b7f6dSBarry Smith #endif 22939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22943a40ed3dSBarry Smith } else if (type == NORM_1) { 229536db0b34SBarry Smith PetscReal *tmp; 229697f1f81fSBarry Smith PetscInt *jj = a->j; 22979566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2298064f8208SBarry Smith *nrm = 0.0; 2299416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 23009371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23019371c9d4SSatish Balay v++; 230217ab2063SBarry Smith } 2303d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2304064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 230517ab2063SBarry Smith } 23069566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23083a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2309064f8208SBarry Smith *nrm = 0.0; 2310d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23118e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 231217ab2063SBarry Smith sum = 0.0; 2313416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23149371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23159371c9d4SSatish Balay v2++; 231617ab2063SBarry Smith } 2317064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231817ab2063SBarry Smith } 23199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2320f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232317ab2063SBarry Smith } 232417ab2063SBarry Smith 2325ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2326d71ae5a4SJacob Faibussowitsch { 23273d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232854f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23292e5835c6SStefano Zampini const MatScalar *va, *vb; 233097f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2331cd0d46ebSvictorle 2332cd0d46ebSvictorle PetscFunctionBegin; 23339566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23349566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23355485867bSBarry Smith if (ma != nb || na != mb) { 23365485867bSBarry Smith *f = PETSC_FALSE; 23373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23385485867bSBarry Smith } 23399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23419371c9d4SSatish Balay aii = aij->i; 23429371c9d4SSatish Balay bii = bij->i; 23439371c9d4SSatish Balay adx = aij->j; 23449371c9d4SSatish Balay bdx = bij->j; 23459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2347cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2348cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2349cd0d46ebSvictorle 2350cd0d46ebSvictorle *f = PETSC_TRUE; 2351cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2352cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 235397f1f81fSBarry Smith PetscInt idc, idr; 23545485867bSBarry Smith PetscScalar vc, vr; 2355cd0d46ebSvictorle /* column/row index/value */ 23565485867bSBarry Smith idc = adx[aptr[i]]; 23575485867bSBarry Smith idr = bdx[bptr[idc]]; 23585485867bSBarry Smith vc = va[aptr[i]]; 23595485867bSBarry Smith vr = vb[bptr[idc]]; 23605485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23615485867bSBarry Smith *f = PETSC_FALSE; 23625485867bSBarry Smith goto done; 2363cd0d46ebSvictorle } else { 23645485867bSBarry Smith aptr[i]++; 23655485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2366cd0d46ebSvictorle } 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle } 2369cd0d46ebSvictorle done: 23709566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23719566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2375cd0d46ebSvictorle } 2376cd0d46ebSvictorle 2377ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2378d71ae5a4SJacob Faibussowitsch { 23793d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 238054f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238154f21887SBarry Smith MatScalar *va, *vb; 23821cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23831cbb95d3SBarry Smith 23841cbb95d3SBarry Smith PetscFunctionBegin; 23859566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23869566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23871cbb95d3SBarry Smith if (ma != nb || na != mb) { 23881cbb95d3SBarry Smith *f = PETSC_FALSE; 23893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23901cbb95d3SBarry Smith } 23919371c9d4SSatish Balay aii = aij->i; 23929371c9d4SSatish Balay bii = bij->i; 23939371c9d4SSatish Balay adx = aij->j; 23949371c9d4SSatish Balay bdx = bij->j; 23959371c9d4SSatish Balay va = aij->a; 23969371c9d4SSatish Balay vb = bij->a; 23979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23991cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 24001cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24011cbb95d3SBarry Smith 24021cbb95d3SBarry Smith *f = PETSC_TRUE; 24031cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24041cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24051cbb95d3SBarry Smith PetscInt idc, idr; 24061cbb95d3SBarry Smith PetscScalar vc, vr; 24071cbb95d3SBarry 
Smith /* column/row index/value */ 24081cbb95d3SBarry Smith idc = adx[aptr[i]]; 24091cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24101cbb95d3SBarry Smith vc = va[aptr[i]]; 24111cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24121cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24131cbb95d3SBarry Smith *f = PETSC_FALSE; 24141cbb95d3SBarry Smith goto done; 24151cbb95d3SBarry Smith } else { 24161cbb95d3SBarry Smith aptr[i]++; 24171cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24181cbb95d3SBarry Smith } 24191cbb95d3SBarry Smith } 24201cbb95d3SBarry Smith } 24211cbb95d3SBarry Smith done: 24229566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24239566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24251cbb95d3SBarry Smith } 24261cbb95d3SBarry Smith 2427d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2428d71ae5a4SJacob Faibussowitsch { 2429416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2430fff8e43fSBarry Smith const PetscScalar *l, *r; 2431fff8e43fSBarry Smith PetscScalar x; 243254f21887SBarry Smith MatScalar *v; 2433fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2434fff8e43fSBarry Smith const PetscInt *jj; 243517ab2063SBarry Smith 24363a40ed3dSBarry Smith PetscFunctionBegin; 243717ab2063SBarry Smith if (ll) { 24383ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24393ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24409566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244108401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24429566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244417ab2063SBarry Smith for (i = 0; i < m; i++) { 244517ab2063SBarry Smith x = 
l[i]; 2446416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24472205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244817ab2063SBarry Smith } 24499566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24509566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245217ab2063SBarry Smith } 245317ab2063SBarry Smith if (rr) { 24549566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245508401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24569566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24582e5835c6SStefano Zampini jj = a->j; 24592205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24619566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24629566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246317ab2063SBarry Smith } 24649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 246617ab2063SBarry Smith } 246717ab2063SBarry Smith 2468d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2469d71ae5a4SJacob Faibussowitsch { 2470db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2471d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247297f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24735d0c19d7SBarry Smith const PetscInt *irow, *icol; 24742e5835c6SStefano Zampini const PetscScalar *aa; 24755d0c19d7SBarry Smith PetscInt nrows, ncols; 247697f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = 
a->ilen; 2477fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2478416022c9SBarry Smith Mat C; 2479cdc6f3adSToby Isaac PetscBool stride; 248017ab2063SBarry Smith 24813a40ed3dSBarry Smith PetscFunctionBegin; 24829566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24839566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24849566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248517ab2063SBarry Smith 24869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2487ff718158SBarry Smith if (stride) { 24889566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2489ff718158SBarry Smith } else { 2490ff718158SBarry Smith first = 0; 2491ff718158SBarry Smith step = 0; 2492ff718158SBarry Smith } 2493fee21e36SBarry Smith if (stride && step == 1) { 249402834360SBarry Smith /* special case of contiguous rows */ 24959566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249602834360SBarry Smith /* loop over new rows determining lens and starting points */ 249702834360SBarry Smith for (i = 0; i < nrows; i++) { 2498bfeeae90SHong Zhang kstart = ai[irow[i]]; 2499a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2500a91a9bebSLisandro Dalcin starts[i] = kstart; 250102834360SBarry Smith for (k = kstart; k < kend; k++) { 2502bfeeae90SHong Zhang if (aj[k] >= first) { 250302834360SBarry Smith starts[i] = k; 250402834360SBarry Smith break; 250502834360SBarry Smith } 250602834360SBarry Smith } 2507a2744918SBarry Smith sum = 0; 250802834360SBarry Smith while (k < kend) { 2509bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2510a2744918SBarry Smith sum++; 251102834360SBarry Smith } 2512a2744918SBarry Smith lens[i] = sum; 251302834360SBarry Smith } 251402834360SBarry Smith /* create submatrix */ 2515cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251697f1f81fSBarry Smith PetscInt n_cols, n_rows; 25179566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2518aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25199566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 252008480c60SBarry Smith C = *B; 25213a40ed3dSBarry Smith } else { 25223bef6203SJed Brown PetscInt rbs, cbs; 25239566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25249566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25259566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25269566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25279566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25289566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 253008480c60SBarry Smith } 2531db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2532db02288aSLois Curfman McInnes 253302834360SBarry Smith /* loop over rows inserting into submatrix */ 2534fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2535db02288aSLois Curfman McInnes j_new = c->j; 2536db02288aSLois Curfman McInnes i_new = c->i; 25379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253802834360SBarry Smith for (i = 0; i < nrows; i++) { 2539a2744918SBarry Smith ii = starts[i]; 2540a2744918SBarry Smith lensi = lens[i]; 2541810441c8SPierre Jolivet if (lensi) { 2542ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2544a2744918SBarry Smith a_new += lensi; 2545810441c8SPierre Jolivet } 2546a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2547a2744918SBarry 
Smith c->ilen[i] = lensi; 254802834360SBarry Smith } 2549fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25519566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25523a40ed3dSBarry Smith } else { 25539566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25549566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25564dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25576bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25584dcab191SBarry Smith smap[icol[i]] = i + 1; 25594dcab191SBarry Smith } 25604dcab191SBarry Smith 256102834360SBarry Smith /* determine lens of each row */ 256202834360SBarry Smith for (i = 0; i < nrows; i++) { 2563bfeeae90SHong Zhang kstart = ai[irow[i]]; 256402834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256502834360SBarry Smith lens[i] = 0; 256602834360SBarry Smith for (k = kstart; k < kend; k++) { 2567ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256802834360SBarry Smith } 256902834360SBarry Smith } 257017ab2063SBarry Smith /* Create and fill new matrix */ 2571a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2572ace3abfcSBarry Smith PetscBool equal; 25730f5bd95cSBarry Smith 257499141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2575aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25769566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2577fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. 
wrong number of nonzeros"); 25789566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257908480c60SBarry Smith C = *B; 25803a40ed3dSBarry Smith } else { 25813bef6203SJed Brown PetscInt rbs, cbs; 25829566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25839566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25849566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25859566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 258637a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25879566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258908480c60SBarry Smith } 25909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2591fb3c7e2dSJunchao Zhang 2592f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2593fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 259417ab2063SBarry Smith for (i = 0; i < nrows; i++) { 259599141d43SSatish Balay row = irow[i]; 2596bfeeae90SHong Zhang kstart = ai[row]; 259799141d43SSatish Balay kend = kstart + a->ilen[row]; 2598bfeeae90SHong Zhang mat_i = c->i[i]; 25998e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26008e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 260199141d43SSatish Balay mat_ilen = c->ilen + i; 260217ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2603bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2604ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26052e5835c6SStefano Zampini *mat_a++ = aa[k]; 260699141d43SSatish Balay (*mat_ilen)++; 260717ab2063SBarry Smith } 260817ab2063SBarry Smith } 260917ab2063SBarry Smith } 26109566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 261102834360SBarry Smith /* Free work space */ 26129566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26139566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26149566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2615cdc6f3adSToby Isaac /* sort */ 2616cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2617cdc6f3adSToby Isaac PetscInt ilen; 2618cdc6f3adSToby Isaac 2619cdc6f3adSToby Isaac mat_i = c->i[i]; 26208e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26218e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2622cdc6f3adSToby Isaac ilen = c->ilen[i]; 26239566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2624cdc6f3adSToby Isaac } 2625fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 262602834360SBarry Smith } 26278c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26289566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2629305c6ccfSStefano Zampini #endif 26309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 263217ab2063SBarry Smith 26339566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2634416022c9SBarry Smith *B = C; 26353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 263617ab2063SBarry Smith } 263717ab2063SBarry Smith 2638ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2639d71ae5a4SJacob Faibussowitsch { 264082d44351SHong Zhang Mat B; 264182d44351SHong Zhang 264282d44351SHong Zhang PetscFunctionBegin; 2643c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26449566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26459566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, 
mat->rmap->n, mat->cmap->n)); 26469566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26479566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26489566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264982d44351SHong Zhang *subMat = B; 2650c2d650bdSHong Zhang } else { 26519566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2652c2d650bdSHong Zhang } 26533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265482d44351SHong Zhang } 265582d44351SHong Zhang 2656ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2657d71ae5a4SJacob Faibussowitsch { 265863b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265963b91edcSBarry Smith Mat outA; 2660ace3abfcSBarry Smith PetscBool row_identity, col_identity; 266163b91edcSBarry Smith 26623a40ed3dSBarry Smith PetscFunctionBegin; 266308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26641df811f5SHong Zhang 26659566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26669566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2667a871dcd8SBarry Smith 266863b91edcSBarry Smith outA = inA; 2669d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26709566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26719566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26722205254eSKarl Rupp 26739566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26749566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26752205254eSKarl Rupp 2676c3122656SLisandro Dalcin a->row = row; 26772205254eSKarl Rupp 26789566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26799566063dSJacob Faibussowitsch 
PetscCall(ISDestroy(&a->col)); 26802205254eSKarl Rupp 2681c3122656SLisandro Dalcin a->col = col; 268263b91edcSBarry Smith 268336db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26859566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2686f0ec6fceSSatish Balay 268794a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268994a9d846SBarry Smith } 269063b91edcSBarry Smith 26919566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2692137fb511SHong Zhang if (row_identity && col_identity) { 26939566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2694137fb511SHong Zhang } else { 26959566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2696137fb511SHong Zhang } 26973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2698a871dcd8SBarry Smith } 2699a871dcd8SBarry Smith 2700d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2701d71ae5a4SJacob Faibussowitsch { 2702f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2703dfa0f9e5SStefano Zampini PetscScalar *v; 2704c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27053a40ed3dSBarry Smith 27063a40ed3dSBarry Smith PetscFunctionBegin; 27079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27089566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2709792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 
27133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2714f0b747eeSBarry Smith } 2715f0b747eeSBarry Smith 2716d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2717d71ae5a4SJacob Faibussowitsch { 271816b64355SHong Zhang PetscInt i; 271916b64355SHong Zhang 272016b64355SHong Zhang PetscFunctionBegin; 272116b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27229566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 272316b64355SHong Zhang 272448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272616b64355SHong Zhang 272716b64355SHong Zhang if (submatj->rbuf1) { 27289566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27299566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 273016b64355SHong Zhang } 273116b64355SHong Zhang 273248a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27339566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 273516b64355SHong Zhang } 273616b64355SHong Zhang 273716b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2738eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27399566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27409566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 274116b64355SHong Zhang #else 27429566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 274316b64355SHong Zhang #endif 274416b64355SHong Zhang 274516b64355SHong Zhang if (!submatj->allcolumns) { 274616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 
2747eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 274816b64355SHong Zhang #else 27499566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 275016b64355SHong Zhang #endif 275116b64355SHong Zhang } 27529566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 275316b64355SHong Zhang 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 275616b64355SHong Zhang } 275716b64355SHong Zhang 2758d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2759d71ae5a4SJacob Faibussowitsch { 276016b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27615c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 276216b64355SHong Zhang 276316b64355SHong Zhang PetscFunctionBegin; 27649566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27659566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276716b64355SHong Zhang } 276816b64355SHong Zhang 276989a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2770ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2771d71ae5a4SJacob Faibussowitsch { 27722d033e1fSHong Zhang PetscInt i; 27730fb991dcSHong Zhang Mat C; 27740fb991dcSHong Zhang Mat_SeqAIJ *c; 27750fb991dcSHong Zhang Mat_SubSppt *submatj; 27762d033e1fSHong Zhang 27772d033e1fSHong Zhang PetscFunctionBegin; 27782d033e1fSHong Zhang for (i = 0; i < n; i++) { 27790fb991dcSHong Zhang C = (*mat)[i]; 27800fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27810fb991dcSHong Zhang submatj = c->submatis1; 27822d033e1fSHong Zhang if (submatj) { 2783682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278426cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27859566063dSJacob Faibussowitsch 
PetscCall((*submatj->destroy)(C)); 27869566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27879566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27883faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27899566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27909566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27919566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2792682e4c99SStefano Zampini } 27932d033e1fSHong Zhang } else { 27949566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27952d033e1fSHong Zhang } 27962d033e1fSHong Zhang } 279786e85357SHong Zhang 279863a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27999566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 280063a75b2aSHong Zhang 28019566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28032d033e1fSHong Zhang } 28042d033e1fSHong Zhang 2805ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2806d71ae5a4SJacob Faibussowitsch { 280797f1f81fSBarry Smith PetscInt i; 2808cddf8d76SBarry Smith 28093a40ed3dSBarry Smith PetscFunctionBegin; 281048a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2811cddf8d76SBarry Smith 281248a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2814cddf8d76SBarry Smith } 2815cddf8d76SBarry Smith 2816ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2817d71ae5a4SJacob Faibussowitsch { 2818e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28199a88ca10SBarry Smith PetscInt 
row, i, j, k, l, ll, m, n, *nidx, isz, val; 28205d0c19d7SBarry Smith const PetscInt *idx; 28219a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2822f1af5d2fSBarry Smith PetscBT table; 2823bbd702dbSSatish Balay 28243a40ed3dSBarry Smith PetscFunctionBegin; 28259a88ca10SBarry Smith m = A->rmap->n / bs; 2826e4d965acSSatish Balay ai = a->i; 2827bfeeae90SHong Zhang aj = a->j; 28288a047759SSatish Balay 282908401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 283006763907SSatish Balay 28319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28329566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 283306763907SSatish Balay 2834e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2835b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2836e4d965acSSatish Balay isz = 0; 28379566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2838e4d965acSSatish Balay 2839e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28409566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28419566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2842e4d965acSSatish Balay 28439a88ca10SBarry Smith if (bs > 1) { 28449a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28459a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28469a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28479a88ca10SBarry Smith } 28489a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28499a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28509a88ca10SBarry Smith 28519a88ca10SBarry Smith k = 0; 28529a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28539a88ca10SBarry Smith n = isz; 28549a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28559a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28569a88ca10SBarry Smith row = bs * nidx[k] + ll; 28579a88ca10SBarry Smith start = ai[row]; 28589a88ca10SBarry Smith end = ai[row + 1]; 28599a88ca10SBarry Smith for (l = start; l < end; l++) { 28609a88ca10SBarry Smith val = aj[l] / bs; 28619a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28629a88ca10SBarry Smith } 28639a88ca10SBarry Smith } 28649a88ca10SBarry Smith } 28659a88ca10SBarry Smith } 28669a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28679a88ca10SBarry Smith } else { 2868dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2869e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28702205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28714dcbc457SBarry Smith } 28729566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28739566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2874e4d965acSSatish Balay 287504a348a9SBarry Smith k = 0; 287604a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287704a348a9SBarry Smith n = isz; 287806763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2879e4d965acSSatish Balay row = nidx[k]; 2880e4d965acSSatish Balay start = ai[row]; 2881e4d965acSSatish Balay end = ai[row + 1]; 288204a348a9SBarry Smith for (l = start; l < end; l++) { 2883efb16452SHong Zhang val = aj[l]; 28842205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2885e4d965acSSatish Balay } 2886e4d965acSSatish Balay } 2887e4d965acSSatish Balay } 28889566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2889e4d965acSSatish Balay } 28909a88ca10SBarry Smith } 28919566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28929566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28944dcbc457SBarry Smith } 289517ab2063SBarry Smith 2896ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2897d71ae5a4SJacob Faibussowitsch { 28980513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28993b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29005d0c19d7SBarry Smith const PetscInt *row, *col; 29015d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 290256cd22aeSBarry Smith IS icolp, irowp; 29030298fd71SBarry Smith PetscInt *cwork = NULL; 29040298fd71SBarry Smith PetscScalar *vwork = NULL; 29050513a670SBarry Smith 
29063a40ed3dSBarry Smith PetscFunctionBegin; 29079566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29089566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29099566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29109566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29110513a670SBarry Smith 29120513a670SBarry Smith /* determine lengths of permuted rows */ 29139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29142205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29159566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29169566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29179566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29189566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29209566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29210513a670SBarry Smith 29229566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29230513a670SBarry Smith for (i = 0; i < m; i++) { 29249566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29252205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29269566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29279566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29280513a670SBarry Smith } 29299566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29302205254eSKarl Rupp 29313c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29322205254eSKarl Rupp 29338c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29349566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29359fe5e383SStefano Zampini #endif 
29369566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29379566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29389566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29399566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29409566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 294248a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29440513a670SBarry Smith } 29450513a670SBarry Smith 2946d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2947d71ae5a4SJacob Faibussowitsch { 2948cb5b572fSBarry Smith PetscFunctionBegin; 294933f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 295033f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2951be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2952be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29532e5835c6SStefano Zampini const PetscScalar *aa; 2954be6bf707SBarry Smith 29559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295608401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29589566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2960cb5b572fSBarry Smith } else { 29619566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2962cb5b572fSBarry Smith } 29633ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2964cb5b572fSBarry Smith } 2965cb5b572fSBarry Smith 2966d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2967d71ae5a4SJacob Faibussowitsch { 29686c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29696e111a19SKarl Rupp 29706c0721eeSBarry Smith PetscFunctionBegin; 29716c0721eeSBarry Smith *array = a->a; 29723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29736c0721eeSBarry Smith } 29746c0721eeSBarry Smith 2975d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2976d71ae5a4SJacob Faibussowitsch { 29776c0721eeSBarry Smith PetscFunctionBegin; 2978f38c1e66SStefano Zampini *array = NULL; 29793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29806c0721eeSBarry Smith } 2981273d9f13SBarry Smith 29828229c054SShri Abhyankar /* 29838229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29848229c054SShri Abhyankar have different nonzero structure. 
29858229c054SShri Abhyankar */ 2986d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2987d71ae5a4SJacob Faibussowitsch { 2988b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2989ec7775f6SShri Abhyankar 2990ec7775f6SShri Abhyankar PetscFunctionBegin; 2991ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2992ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29938e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2994b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2995b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29968af7cee1SJed Brown nnz[i] = 0; 29978af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2998b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2999b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30008af7cee1SJed Brown nnz[i]++; 30018af7cee1SJed Brown } 30028af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3003ec7775f6SShri Abhyankar } 30043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3005ec7775f6SShri Abhyankar } 3006ec7775f6SShri Abhyankar 3007d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3008d71ae5a4SJacob Faibussowitsch { 3009b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3010b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3011b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3012b264fe52SHong Zhang 3013b264fe52SHong Zhang PetscFunctionBegin; 3014b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30159566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3017b264fe52SHong Zhang } 
3018b264fe52SHong Zhang 3019d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3020d71ae5a4SJacob Faibussowitsch { 3021ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3022ac90fabeSBarry Smith 3023ac90fabeSBarry Smith PetscFunctionBegin; 3024134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3025134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3026134adf20SPierre Jolivet if (e) { 30279566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 302881fa06acSBarry Smith if (e) { 30299566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3030134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303181fa06acSBarry Smith } 303281fa06acSBarry Smith } 303354c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303481fa06acSBarry Smith } 3035ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30362e5835c6SStefano Zampini const PetscScalar *xa; 30372e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 303881fa06acSBarry Smith PetscBLASInt one = 1, bnz; 303981fa06acSBarry Smith 30409566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3043792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30489566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3049ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30509566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3051ac90fabeSBarry Smith } else { 30528229c054SShri Abhyankar Mat B; 30538229c054SShri Abhyankar PetscInt *nnz; 30549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30559566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30569566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30579566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30589566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30599566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30619566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30629566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30639bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30649566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3065ac90fabeSBarry Smith } 30663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3067ac90fabeSBarry Smith } 3068ac90fabeSBarry Smith 3069d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3070d71ae5a4SJacob Faibussowitsch { 3071354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3072354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3073354c94deSBarry Smith PetscInt i, nz; 3074354c94deSBarry Smith PetscScalar *a; 3075354c94deSBarry Smith 3076354c94deSBarry Smith PetscFunctionBegin; 3077354c94deSBarry Smith nz = aij->nz; 30789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30792205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3081354c94deSBarry Smith #else 3082354c94deSBarry Smith PetscFunctionBegin; 3083354c94deSBarry Smith #endif 30843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3085354c94deSBarry Smith } 3086354c94deSBarry Smith 3087ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3088d71ae5a4SJacob Faibussowitsch { 3089e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3090d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3091e34fafa9SBarry Smith PetscReal atmp; 3092985db425SBarry Smith PetscScalar *x; 3093ce496241SStefano Zampini const MatScalar *aa, *av; 3094e34fafa9SBarry Smith 3095e34fafa9SBarry Smith PetscFunctionBegin; 309628b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3098ce496241SStefano Zampini aa = av; 3099e34fafa9SBarry Smith ai = a->i; 3100e34fafa9SBarry Smith aj = a->j; 3101e34fafa9SBarry Smith 31029566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31039566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31049566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 310508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3106e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31079371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31089371c9d4SSatish Balay ai++; 3109e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3110985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31119371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31129371c9d4SSatish Balay x[i] = atmp; 31139371c9d4SSatish Balay if (idx) idx[i] = *aj; 31149371c9d4SSatish Balay } 31159371c9d4SSatish Balay aa++; 31169371c9d4SSatish Balay aj++; 3117985db425SBarry Smith } 3118985db425SBarry 
Smith } 31199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3122985db425SBarry Smith } 3123985db425SBarry Smith 3124eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3125eede4a3fSMark Adams { 3126eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3127eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3128eede4a3fSMark Adams PetscScalar *x; 3129eede4a3fSMark Adams const MatScalar *aa, *av; 3130eede4a3fSMark Adams 3131eede4a3fSMark Adams PetscFunctionBegin; 3132eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3133eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3134eede4a3fSMark Adams aa = av; 3135eede4a3fSMark Adams ai = a->i; 3136eede4a3fSMark Adams 3137eede4a3fSMark Adams PetscCall(VecSet(v, 0.0)); 3138eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3139eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3140eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3141eede4a3fSMark Adams for (i = 0; i < m; i++) { 3142eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3143eede4a3fSMark Adams ai++; 3144eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3145eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3146eede4a3fSMark Adams aa++; 3147eede4a3fSMark Adams } 3148eede4a3fSMark Adams } 3149eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3150eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3151eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3152eede4a3fSMark Adams } 3153eede4a3fSMark Adams 3154ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3155d71ae5a4SJacob Faibussowitsch { 3156985db425SBarry Smith Mat_SeqAIJ *a 
= (Mat_SeqAIJ *)A->data; 3157d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3158985db425SBarry Smith PetscScalar *x; 3159ce496241SStefano Zampini const MatScalar *aa, *av; 3160985db425SBarry Smith 3161985db425SBarry Smith PetscFunctionBegin; 316228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3164ce496241SStefano Zampini aa = av; 3165985db425SBarry Smith ai = a->i; 3166985db425SBarry Smith aj = a->j; 3167985db425SBarry Smith 31689566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31699566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31709566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 317108401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3172985db425SBarry Smith for (i = 0; i < m; i++) { 31739371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31749371c9d4SSatish Balay ai++; 3175d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31769371c9d4SSatish Balay x[i] = *aa; 31779371c9d4SSatish Balay if (idx) idx[i] = 0; 3178985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3179985db425SBarry Smith x[i] = 0.0; 3180985db425SBarry Smith if (idx) { 3181985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3182985db425SBarry Smith if (aj[j] > j) { 3183985db425SBarry Smith idx[i] = j; 3184985db425SBarry Smith break; 3185985db425SBarry Smith } 3186985db425SBarry Smith } 31871a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31881a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3189985db425SBarry Smith } 3190985db425SBarry Smith } 3191985db425SBarry Smith for (j = 0; j < ncols; j++) { 31929371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) 
{ 31939371c9d4SSatish Balay x[i] = *aa; 31949371c9d4SSatish Balay if (idx) idx[i] = *aj; 31959371c9d4SSatish Balay } 31969371c9d4SSatish Balay aa++; 31979371c9d4SSatish Balay aj++; 3198985db425SBarry Smith } 3199985db425SBarry Smith } 32009566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3203985db425SBarry Smith } 3204985db425SBarry Smith 3205ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3206d71ae5a4SJacob Faibussowitsch { 3207c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3208c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3209ce496241SStefano Zampini PetscScalar *x; 3210ce496241SStefano Zampini const MatScalar *aa, *av; 3211c87e5d42SMatthew Knepley 3212c87e5d42SMatthew Knepley PetscFunctionBegin; 32139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3214ce496241SStefano Zampini aa = av; 3215c87e5d42SMatthew Knepley ai = a->i; 3216c87e5d42SMatthew Knepley aj = a->j; 3217c87e5d42SMatthew Knepley 32189566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32199566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32209566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 322108401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3222c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32239371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32249371c9d4SSatish Balay ai++; 3225f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32269371c9d4SSatish Balay x[i] = *aa; 32279371c9d4SSatish Balay if (idx) idx[i] = 0; 3228f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3229f07e67edSHong Zhang x[i] = 0.0; 3230f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3231289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3232f07e67edSHong Zhang if (aj[j] > j) { 3233f07e67edSHong Zhang idx[i] = j; 32342205254eSKarl Rupp break; 32352205254eSKarl Rupp } 3236289a08f5SMatthew Knepley } 3237f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3238f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3239f07e67edSHong Zhang } 3240289a08f5SMatthew Knepley } 3241c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32429371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32439371c9d4SSatish Balay x[i] = *aa; 32449371c9d4SSatish Balay if (idx) idx[i] = *aj; 32459371c9d4SSatish Balay } 32469371c9d4SSatish Balay aa++; 32479371c9d4SSatish Balay aj++; 3248c87e5d42SMatthew Knepley } 3249c87e5d42SMatthew Knepley } 32509566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3253c87e5d42SMatthew Knepley } 3254c87e5d42SMatthew Knepley 3255ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3256d71ae5a4SJacob Faibussowitsch { 3257985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3258d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3259d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3260985db425SBarry Smith PetscScalar *x; 
3261ce496241SStefano Zampini const MatScalar *aa, *av; 3262985db425SBarry Smith 3263985db425SBarry Smith PetscFunctionBegin; 326428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3266ce496241SStefano Zampini aa = av; 3267985db425SBarry Smith ai = a->i; 3268985db425SBarry Smith aj = a->j; 3269985db425SBarry Smith 32709566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32719566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32729566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 327308401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3274985db425SBarry Smith for (i = 0; i < m; i++) { 32759371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32769371c9d4SSatish Balay ai++; 3277d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32789371c9d4SSatish Balay x[i] = *aa; 32799371c9d4SSatish Balay if (idx) idx[i] = 0; 3280985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3281985db425SBarry Smith x[i] = 0.0; 3282985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3283985db425SBarry Smith for (j = 0; j < ncols; j++) { 3284985db425SBarry Smith if (aj[j] > j) { 3285985db425SBarry Smith idx[i] = j; 3286985db425SBarry Smith break; 3287985db425SBarry Smith } 3288985db425SBarry Smith } 3289fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3290fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3291985db425SBarry Smith } 3292985db425SBarry Smith } 3293985db425SBarry Smith for (j = 0; j < ncols; j++) { 32949371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32959371c9d4SSatish Balay x[i] = *aa; 32969371c9d4SSatish Balay if (idx) idx[i] = *aj; 32979371c9d4SSatish Balay } 32989371c9d4SSatish Balay aa++; 
32999371c9d4SSatish Balay aj++; 3300e34fafa9SBarry Smith } 3301e34fafa9SBarry Smith } 33029566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 33039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 33043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3305e34fafa9SBarry Smith } 3306bbead8a2SBarry Smith 3307ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3308d71ae5a4SJacob Faibussowitsch { 3309bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 331033d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3311bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33120da83c2eSBarry Smith const PetscReal shift = 0.0; 33131a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3314bbead8a2SBarry Smith 3315bbead8a2SBarry Smith PetscFunctionBegin; 3316a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33174a0d0026SBarry Smith if (a->ibdiagvalid) { 33184a0d0026SBarry Smith if (values) *values = a->ibdiag; 33193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33204a0d0026SBarry Smith } 33219566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33224dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3323bbead8a2SBarry Smith diag = a->ibdiag; 3324bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3325bbead8a2SBarry Smith /* factor and invert each block */ 3326bbead8a2SBarry Smith switch (bs) { 3327bbead8a2SBarry Smith case 1: 3328bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33299566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3330ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3331ec1892c8SHong Zhang if (allowzeropivot) { 33327b6c816cSBarry Smith A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 33337b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33347b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33359566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 333698921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3337ec1892c8SHong Zhang } 3338bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3339bbead8a2SBarry Smith } 3340bbead8a2SBarry Smith break; 3341bbead8a2SBarry Smith case 2: 3342bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33439371c9d4SSatish Balay ij[0] = 2 * i; 33449371c9d4SSatish Balay ij[1] = 2 * i + 1; 33459566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33477b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3349bbead8a2SBarry Smith diag += 4; 3350bbead8a2SBarry Smith } 3351bbead8a2SBarry Smith break; 3352bbead8a2SBarry Smith case 3: 3353bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33549371c9d4SSatish Balay ij[0] = 3 * i; 33559371c9d4SSatish Balay ij[1] = 3 * i + 1; 33569371c9d4SSatish Balay ij[2] = 3 * i + 2; 33579566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33597b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33609566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3361bbead8a2SBarry Smith diag += 9; 3362bbead8a2SBarry Smith } 3363bbead8a2SBarry Smith break; 3364bbead8a2SBarry Smith case 4: 3365bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33669371c9d4SSatish Balay ij[0] = 4 * i; 33679371c9d4SSatish Balay ij[1] = 4 * i + 1; 33689371c9d4SSatish Balay ij[2] = 4 * i + 2; 33699371c9d4SSatish Balay ij[3] = 4 * i + 3; 33709566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33727b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3374bbead8a2SBarry Smith diag += 16; 3375bbead8a2SBarry Smith } 3376bbead8a2SBarry Smith break; 3377bbead8a2SBarry Smith case 5: 3378bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33799371c9d4SSatish Balay ij[0] = 5 * i; 33809371c9d4SSatish Balay ij[1] = 5 * i + 1; 33819371c9d4SSatish Balay ij[2] = 5 * i + 2; 33829371c9d4SSatish Balay ij[3] = 5 * i + 3; 33839371c9d4SSatish Balay ij[4] = 5 * i + 4; 33849566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33867b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3388bbead8a2SBarry Smith diag += 25; 3389bbead8a2SBarry Smith } 3390bbead8a2SBarry Smith break; 3391bbead8a2SBarry Smith case 6: 3392bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33939371c9d4SSatish Balay ij[0] = 6 * i; 33949371c9d4SSatish Balay ij[1] = 6 * i + 1; 33959371c9d4SSatish Balay ij[2] = 6 * i + 2; 33969371c9d4SSatish Balay ij[3] = 6 * i + 3; 33979371c9d4SSatish Balay ij[4] = 
6 * i + 4; 33989371c9d4SSatish Balay ij[5] = 6 * i + 5; 33999566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 34009566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 34017b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34029566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3403bbead8a2SBarry Smith diag += 36; 3404bbead8a2SBarry Smith } 3405bbead8a2SBarry Smith break; 3406bbead8a2SBarry Smith case 7: 3407bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34089371c9d4SSatish Balay ij[0] = 7 * i; 34099371c9d4SSatish Balay ij[1] = 7 * i + 1; 34109371c9d4SSatish Balay ij[2] = 7 * i + 2; 34119371c9d4SSatish Balay ij[3] = 7 * i + 3; 34129371c9d4SSatish Balay ij[4] = 7 * i + 4; 34139371c9d4SSatish Balay ij[5] = 7 * i + 5; 3414cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34177b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34189566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3419bbead8a2SBarry Smith diag += 49; 3420bbead8a2SBarry Smith } 3421bbead8a2SBarry Smith break; 3422bbead8a2SBarry Smith default: 34239566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3424bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3425ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34269566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34287b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3430bbead8a2SBarry Smith diag += bs2; 3431bbead8a2SBarry Smith } 34329566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3433bbead8a2SBarry Smith } 3434bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3436bbead8a2SBarry Smith } 3437bbead8a2SBarry Smith 3438d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3439d71ae5a4SJacob Faibussowitsch { 344073a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3441fff043a9SJunchao Zhang PetscScalar a, *aa; 344273a71a0fSBarry Smith PetscInt m, n, i, j, col; 344373a71a0fSBarry Smith 344473a71a0fSBarry Smith PetscFunctionBegin; 344573a71a0fSBarry Smith if (!x->assembled) { 34469566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 344773a71a0fSBarry Smith for (i = 0; i < m; i++) { 344873a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34499566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 345073a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34519566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 345273a71a0fSBarry Smith } 345373a71a0fSBarry Smith } 3454e2ce353bSJunchao Zhang } else { 34559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34569566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3458e2ce353bSJunchao Zhang } 34599566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34609566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 346273a71a0fSBarry Smith } 346373a71a0fSBarry Smith 3464679944adSJunchao 
/*
  Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high)

  Columns are drawn from a range shortened by (high - low); any drawn column at or beyond low is then
  shifted right by that amount, so nothing lands inside the hole. Unlike MatSetRandom_SeqAIJ there is
  no separate path for an already assembled matrix: values are always added through MatSetValues().
*/
PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
  PetscScalar a;
  PetscInt    m, n, i, j, col, nskip;

  PetscFunctionBegin;
  nskip = high - low;
  PetscCall(MatGetSize(x, &m, &n));
  n -= nskip; /* shrink number of columns where nonzeros can be set */
  for (i = 0; i < m; i++) {
    for (j = 0; j < aij->imax[i]; j++) {
      PetscCall(PetscRandomGetValue(rctx, &a));
      col = (PetscInt)(n * PetscRealPart(a)); /* the same draw picks the column and is the value */
      if (col >= low) col += nskip; /* shift col rightward to skip the hole */
      PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
    }
  }
  PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
  PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  Operation table for this matrix type.

  The initializer is positional: an entry's position selects the struct _MatOps member it fills, so
  entries must never be reordered, inserted or removed without checking the struct definition. The
  numeric comments give the slot index of the entry they precede. NULL leaves a slot empty.
*/
static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
                                       MatGetRow_SeqAIJ,
                                       MatRestoreRow_SeqAIJ,
                                       MatMult_SeqAIJ,
                                       /*  4*/ MatMultAdd_SeqAIJ,
                                       MatMultTranspose_SeqAIJ,
                                       MatMultTransposeAdd_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 10*/ NULL,
                                       MatLUFactor_SeqAIJ,
                                       NULL,
                                       MatSOR_SeqAIJ,
                                       MatTranspose_SeqAIJ,
                                       /* 15*/ MatGetInfo_SeqAIJ,
                                       MatEqual_SeqAIJ,
                                       MatGetDiagonal_SeqAIJ,
                                       MatDiagonalScale_SeqAIJ,
                                       MatNorm_SeqAIJ,
                                       /* 20*/ NULL,
                                       MatAssemblyEnd_SeqAIJ,
                                       MatSetOption_SeqAIJ,
                                       MatZeroEntries_SeqAIJ,
                                       /* 24*/ MatZeroRows_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 29*/ MatSetUp_Seq_Hash,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 34*/ MatDuplicate_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatILUFactor_SeqAIJ,
                                       NULL,
                                       /* 39*/ MatAXPY_SeqAIJ,
                                       MatCreateSubMatrices_SeqAIJ,
                                       MatIncreaseOverlap_SeqAIJ,
                                       MatGetValues_SeqAIJ,
                                       MatCopy_SeqAIJ,
                                       /* 44*/ MatGetRowMax_SeqAIJ,
                                       MatScale_SeqAIJ,
                                       MatShift_SeqAIJ,
                                       MatDiagonalSet_SeqAIJ,
                                       MatZeroRowsColumns_SeqAIJ,
                                       /* 49*/ MatSetRandom_SeqAIJ,
                                       MatGetRowIJ_SeqAIJ,
                                       MatRestoreRowIJ_SeqAIJ,
                                       MatGetColumnIJ_SeqAIJ,
                                       MatRestoreColumnIJ_SeqAIJ,
                                       /* 54*/ MatFDColoringCreate_SeqXAIJ,
                                       NULL,
                                       NULL,
                                       MatPermute_SeqAIJ,
                                       NULL,
                                       /* 59*/ NULL,
                                       MatDestroy_SeqAIJ,
                                       MatView_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 64*/ NULL,
                                       MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 69*/ MatGetRowMaxAbs_SeqAIJ,
                                       MatGetRowMinAbs_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 74*/ NULL,
                                       MatFDColoringApply_AIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 79*/ MatFindZeroDiagonals_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatLoad_SeqAIJ,
                                       /* 84*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 89*/ NULL,
                                       NULL,
                                       MatMatMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
                                       NULL,
                                       NULL,
                                       MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       /* 99*/ MatProductSetFromOptions_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatConjugate_SeqAIJ,
                                       NULL,
                                       /*104*/ MatSetValuesRow_SeqAIJ,
                                       MatRealPart_SeqAIJ,
                                       MatImaginaryPart_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /*109*/ MatMatSolve_SeqAIJ,
                                       NULL,
                                       MatGetRowMin_SeqAIJ,
                                       NULL,
                                       MatMissingDiagonal_SeqAIJ,
                                       /*114*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /*119*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatGetMultiProcBlock_SeqAIJ,
                                       /*124*/ MatFindNonzeroRows_SeqAIJ,
                                       MatGetColumnReductions_SeqAIJ,
                                       MatInvertBlockDiagonal_SeqAIJ,
                                       MatInvertVariableBlockDiagonal_SeqAIJ,
                                       NULL,
                                       /*129*/ NULL,
                                       NULL,
                                       NULL,
                                       MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
                                       MatTransposeColoringCreate_SeqAIJ,
                                       /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
                                       MatTransColoringApplyDenToSp_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatRARtNumeric_SeqAIJ_SeqAIJ,
                                       /*139*/ NULL,
                                       NULL,
                                       NULL,
                                       MatFDColoringSetUp_SeqXAIJ,
                                       MatFindOffBlockDiagonalEntries_SeqAIJ,
                                       MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
                                       /*145*/ MatDestroySubMatrices_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatCreateGraph_Simple_AIJ,
                                       NULL,
                                       /*150*/ MatTransposeSymbolic_SeqAIJ,
                                       MatEliminateZeros_SeqAIJ,
                                       MatGetRowSumAbs_SeqAIJ};

/*
  Type-specific implementation of MatSeqAIJSetColumnIndices().

  Copies aij->maxnz entries from indices into the column-index array, sets nz to maxnz, and sets every
  row's current length (ilen) to its limit (imax), i.e. every row is treated as completely filled.
  No validation of indices is done here.
*/
static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  PetscInt    i, nz, n;

  PetscFunctionBegin;
  nz = aij->maxnz;
  n  = mat->rmap->n;
  for (i = 0; i < nz; i++) aij->j[i] = indices[i];
  aij->nz = nz;
  for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
 * Given a sparse matrix with global column indices, compact it by using a local column space.
3658ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3659ddea5d60SJunchao Zhang */ 3660d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3661d71ae5a4SJacob Faibussowitsch { 3662a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3663eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3664eec179cfSJacob Faibussowitsch PetscHashIter tpos; 366525b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 366625b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3667a3bb6f32SFande Kong 3668a3bb6f32SFande Kong PetscFunctionBegin; 3669a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36704f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3671a3bb6f32SFande Kong /* use a table */ 3672eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3673a3bb6f32SFande Kong ec = 0; 367425b670f0SStefano Zampini for (i = 0; i < nz; i++) { 367525b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3676eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3677a3bb6f32SFande Kong if (!data) { 3678a3bb6f32SFande Kong /* one based table */ 3679c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3680a3bb6f32SFande Kong } 3681a3bb6f32SFande Kong } 3682a3bb6f32SFande Kong /* form array of columns we need */ 36839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3684eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3685eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3686eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3687eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3688eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3689a3bb6f32SFande Kong gid--; 3690a3bb6f32SFande 
Kong lid--; 3691a3bb6f32SFande Kong garray[lid] = gid; 3692a3bb6f32SFande Kong } 36939566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3694eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3695c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3696a3bb6f32SFande Kong /* compact out the extra columns in B */ 369725b670f0SStefano Zampini for (i = 0; i < nz; i++) { 369825b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3699eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3700a3bb6f32SFande Kong lid--; 370125b670f0SStefano Zampini jj[i] = lid; 3702a3bb6f32SFande Kong } 37039566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3704eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 37059566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 37069566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 37079566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 37083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3709a3bb6f32SFande Kong } 3710a3bb6f32SFande Kong 3711bef8e0ddSBarry Smith /*@ 3712bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3713bef8e0ddSBarry Smith in the matrix. 

  Input Parameters:
+ mat     - the `MATSEQAIJ` matrix
- indices - the column indices

  Level: advanced

  Notes:
  This can be called if you have precomputed the nonzero structure of the
  matrix and want to provide it to the matrix object to improve the performance
  of the `MatSetValues()` operation.

  You MUST have set the correct numbers of nonzeros per row in the call to
  `MatCreateSeqAIJ()`, and the column indices MUST be sorted.

  MUST be called before any calls to `MatSetValues()`

  The indices should start with zero, not one.

.seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
@*/
PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  PetscAssertPointer(indices, 2);
  /* dispatch to whatever the matrix has registered under this name */
  PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  Type-specific implementation of MatStoreValues().

  Copies the current numerical values (aij->a) into aij->saved_values. The number of values is read
  from the last entry of the row-pointer array. The save buffer is allocated on first use and reused
  on later calls. Fails unless new nonzero locations have been disallowed (aij->nonew).
*/
static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  size_t      nz  = aij->i[mat->rmap->n];

  PetscFunctionBegin;
  PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");

  /* allocate space for values if not already there */
  if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }

  /* copy values over */
  PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@
  MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
  nonlinear portion.

  Logically Collective

  Input Parameter:
. mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

  Example Usage:
.vb
    Using SNES
    Create Jacobian matrix
    Set linear terms into matrix
    Apply boundary conditions to matrix, at this time matrix must have
      final nonzero structure (i.e.
      setting the nonlinear terms and applying
      boundary conditions again will not change the nonzero structure)
    MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
    MatStoreValues(mat);
    Call SNESSetJacobian() with matrix
    In your Jacobian routine
      MatRetrieveValues(mat);
      Set nonlinear terms in matrix

    Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
    // build linear portion of Jacobian
    MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
    MatStoreValues(mat);
    loop over nonlinear iterations
       MatRetrieveValues(mat);
       // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
       // call MatAssemblyBegin/End() on matrix
       Solve linear system with Jacobian
    endloop
.ve

  Notes:
  Matrix must already be assembled before calling this routine
  Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
  calling this routine.

  When this is called multiple times it overwrites the previous set of stored values
  and does not allocate additional space.

.seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
@*/
PetscErrorCode MatStoreValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* only an assembled, unfactored matrix may be stored */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  Type-specific implementation of MatRetrieveValues().

  Copies aij->saved_values back over the matrix values (aij->a). The number of values is read from the
  last entry of the row-pointer array. Fails if new nonzero locations are still allowed or if nothing
  has been stored yet.
*/
static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  PetscInt    nz  = aij->i[mat->rmap->n];

  PetscFunctionBegin;
  PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
  PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
  /* copy values over */
  PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@
  MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`

  Logically Collective

  Input Parameter:
. mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

.seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
@*/
PetscErrorCode MatRetrieveValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* same state requirements as MatStoreValues(): assembled and not factored */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@C
  MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
  (the default parallel PETSc format).  For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).

  Collective

  Input Parameters:
+ comm - MPI communicator, set to `PETSC_COMM_SELF`
. m    - number of rows
. n    - number of columns
.
  nz   - number of nonzeros per row (same for all rows)
- nnz  - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Output Parameter:
. A - the matrix

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  It is recommended to use `MatCreateFromOptions()` instead of this routine

  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  By default, this format uses inodes (identical nodes) when possible, to
  improve numerical efficiency of matrix-vector products and solves. We
  search for consecutive rows with the same nonzero structure, thereby
  reusing matrix information to achieve increased efficiency.

.seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  PetscCall(MatCreate(comm, A));
  /* m and n are passed as both the local and the global sizes */
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* calls the SeqAIJ preallocation routine directly rather than going through MatSeqAIJSetPreallocation() */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@C
  MatSeqAIJSetPreallocation - For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter nz
  (or the array nnz).  By setting these parameters accurately, performance
  during matrix assembly can be increased by more than a factor of 50.

  Collective

  Input Parameters:
+ B   - The matrix
.
  nz  - number of nonzeros per row (same for all rows)
- nnz - array containing the number of nonzeros in the various rows
        (possibly different for each row) or NULL

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.  See the users' manual for details.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  You can call `MatGetInfo()` to get information on how effective the preallocation was;
  for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
  You can also run with the option -info and look for messages with the string
  malloc in them to see if additional memory allocation was needed.
3945aa95bbe8SBarry Smith 394611a5261eSBarry Smith Developer Notes: 394711a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3948a96a251dSBarry Smith entries or columns indices 3949a96a251dSBarry Smith 3950273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3951273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3952273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3953273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3954273d9f13SBarry Smith 39551cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3956db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3957273d9f13SBarry Smith @*/ 3958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3959d71ae5a4SJacob Faibussowitsch { 3960a23d5eceSKris Buschelman PetscFunctionBegin; 39616ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39626ba663aaSJed Brown PetscValidType(B, 1); 3963cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3965a23d5eceSKris Buschelman } 3966a23d5eceSKris Buschelman 3967d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3968d71ae5a4SJacob Faibussowitsch { 3969ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39702576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 397197f1f81fSBarry Smith PetscInt i; 3972273d9f13SBarry Smith 3973273d9f13SBarry Smith PetscFunctionBegin; 3974ad79cf63SBarry Smith if (B->hash_active) { 3975aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3976ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3977ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3978ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3979ad79cf63SBarry Smith } 39802576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3981a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3982c461c341SBarry Smith skipallocation = PETSC_TRUE; 3983c461c341SBarry Smith nz = 0; 3984c461c341SBarry Smith } 39859566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3987899cda47SBarry Smith 3988435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 398908401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3990cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3991d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 399208401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 399308401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3994b73539f3SBarry Smith } 3995b73539f3SBarry Smith } 3996b73539f3SBarry Smith 3997273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3998ab93d7beSBarry Smith if (!skipallocation) { 39994dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 4000071fcb05SBarry Smith if (!b->ilen) { 4001071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 40029566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 4003071fcb05SBarry Smith } else { 40049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 40052ee49352SLisandro Dalcin } 4006aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 4007273d9f13SBarry Smith if (!nnz) { 4008435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4009c62bd62aSJed Brown else if (nz < 0) nz = 1; 40105d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4011d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4012c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4013273d9f13SBarry Smith } else { 4014c73702f5SBarry Smith PetscInt64 nz64 = 0; 40159371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40169371c9d4SSatish Balay b->imax[i] = nnz[i]; 40179371c9d4SSatish Balay nz64 += nnz[i]; 40189371c9d4SSatish Balay } 40199566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4020273d9f13SBarry Smith } 4021ab93d7beSBarry Smith 4022273d9f13SBarry Smith /* allocate the matrix space */ 402353dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40249566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4025396832f4SHong Zhang if (B->structure_only) { 40269566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4028396832f4SHong Zhang } else { 40299566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4030396832f4SHong Zhang } 4031bfeeae90SHong Zhang b->i[0] = 0; 4032ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4033396832f4SHong Zhang if (B->structure_only) { 4034396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4035396832f4SHong Zhang b->free_a = PETSC_FALSE; 4036396832f4SHong Zhang } else { 4037273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4038e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4039396832f4SHong Zhang } 4040e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4041c461c341SBarry Smith } else { 4042e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4043e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4044c461c341SBarry Smith } 4045273d9f13SBarry Smith 4046846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4047846b4da1SFande Kong /* reserve user-requested sparsity */ 40489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4049846b4da1SFande Kong } 4050846b4da1SFande Kong 4051273d9f13SBarry Smith b->nz = 0; 4052273d9f13SBarry Smith b->maxnz = nz; 4053273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40541baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4055cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4056cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40575519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40585519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40595519a089SJose E. Roman */ 40605519a089SJose E. Roman B->nonzerostate++; 40613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4062273d9f13SBarry Smith } 4063273d9f13SBarry Smith 4064ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4065d71ae5a4SJacob Faibussowitsch { 4066846b4da1SFande Kong Mat_SeqAIJ *a; 4067a5bbaf83SFande Kong PetscInt i; 40681f14be2bSBarry Smith PetscBool skipreset; 4069846b4da1SFande Kong 4070846b4da1SFande Kong PetscFunctionBegin; 4071846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 407214d0e64fSAlex Lindsay 407314d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40743ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 407514d0e64fSAlex Lindsay 4076846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40772c814fdeSFande Kong /* if no saved info, we error out */ 407828b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40792c814fdeSFande Kong 40801f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40812c814fdeSFande Kong 40821f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40831f14be2bSBarry Smith if (!skipreset) { 40849566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40859566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4086846b4da1SFande Kong a->i[0] = 0; 4087ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4088846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4089846b4da1SFande Kong a->nz = 0; 4090846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4091846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4092846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4093846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 40941f14be2bSBarry Smith } 40953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4096846b4da1SFande Kong } 4097846b4da1SFande Kong 409858d36128SBarry Smith /*@ 409911a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4100a1661176SMatthew Knepley 4101a1661176SMatthew Knepley Input Parameters: 4102a1661176SMatthew Knepley + B - the matrix 4103d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4104d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row 4105d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4106a1661176SMatthew Knepley 4107a1661176SMatthew Knepley Level: developer 4108a1661176SMatthew Knepley 41096a9b8d82SBarry Smith Notes: 41102ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 411158d36128SBarry Smith 41126a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41136a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41146a9b8d82SBarry Smith 41156a9b8d82SBarry Smith Developer Notes: 41162ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41172ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41186a9b8d82SBarry Smith 411911a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41206a9b8d82SBarry Smith 4121fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4122a1661176SMatthew Knepley @*/ 4123d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4124d71ae5a4SJacob Faibussowitsch { 4125a1661176SMatthew Knepley PetscFunctionBegin; 41260700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41276ba663aaSJed Brown PetscValidType(B, 1); 4128cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4130a1661176SMatthew Knepley } 4131a1661176SMatthew Knepley 4132ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4133d71ae5a4SJacob Faibussowitsch { 4134a1661176SMatthew Knepley PetscInt i; 4135a1661176SMatthew Knepley PetscInt m, n; 4136a1661176SMatthew Knepley PetscInt nz; 41376a9b8d82SBarry Smith PetscInt *nnz; 4138a1661176SMatthew Knepley 4139a1661176SMatthew Knepley PetscFunctionBegin; 4140aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4141779a8d59SSatish Balay 41429566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41439566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4144779a8d59SSatish Balay 41459566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4147a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4148b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 414908401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4150a1661176SMatthew Knepley nnz[i] = nz; 4151a1661176SMatthew Knepley } 41529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41539566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4154a1661176SMatthew Knepley 41558e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4156a1661176SMatthew Knepley 41579566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41589566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4159a1661176SMatthew Knepley 41609566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4162a1661176SMatthew Knepley } 4163a1661176SMatthew Knepley 4164ad7e164aSPierre Jolivet /*@ 41652ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4166ad7e164aSPierre Jolivet 4167ad7e164aSPierre Jolivet Input Parameters: 4168ad7e164aSPierre Jolivet + A - left-hand side matrix 4169ad7e164aSPierre Jolivet . B - right-hand side matrix 417011a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4171ad7e164aSPierre Jolivet 4172ad7e164aSPierre Jolivet Output Parameter: 41732ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4174ad7e164aSPierre Jolivet 4175ad7e164aSPierre Jolivet Level: intermediate 4176ad7e164aSPierre Jolivet 417711a5261eSBarry Smith Note: 417811a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4179ad7e164aSPierre Jolivet 41801cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4181ad7e164aSPierre Jolivet @*/ 4182d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4183d71ae5a4SJacob Faibussowitsch { 4184ad7e164aSPierre Jolivet PetscFunctionBegin; 4185ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4186ad7e164aSPierre Jolivet PetscValidType(A, 1); 4187ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4188ad7e164aSPierre Jolivet PetscValidType(B, 2); 41894f572ea9SToby Isaac PetscAssertPointer(C, 4); 4190ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4191ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4192ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4193ad7e164aSPierre Jolivet } 4194cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4196ad7e164aSPierre Jolivet } 4197ad7e164aSPierre Jolivet 4198ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4199d71ae5a4SJacob Faibussowitsch { 4200ad7e164aSPierre Jolivet Mat newmat; 4201ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4202ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4203ad7e164aSPierre Jolivet PetscScalar *v; 4204fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4205ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4206ad7e164aSPierre Jolivet PetscBool flg; 4207ad7e164aSPierre Jolivet 4208ad7e164aSPierre Jolivet PetscFunctionBegin; 420928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421028b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 421128b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421228b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42139566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 421428b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4215aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4216ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42179566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42189566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42209566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4221ad7e164aSPierre Jolivet i[0] = 0; 4222ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4223ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4224ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4225ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4226ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4227ad7e164aSPierre Jolivet } 4228ad7e164aSPierre Jolivet } 4229ad7e164aSPierre Jolivet } 42309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4231ad7e164aSPierre Jolivet *C = newmat; 42329566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4233ad7e164aSPierre Jolivet nnz = 0; 4234ad7e164aSPierre Jolivet } 42359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4238ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4239ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4240ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4241ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4242ad7e164aSPierre Jolivet } 4243ad7e164aSPierre Jolivet } 4244ad7e164aSPierre Jolivet } 42459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4249ad7e164aSPierre Jolivet } 4250ad7e164aSPierre Jolivet 4251c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4252af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4253170fe5c8SBarry Smith 4254170fe5c8SBarry Smith /* 4255170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4256170fe5c8SBarry Smith 4257170fe5c8SBarry Smith n p p 42582da392ccSBarry Smith [ ] [ ] [ ] 42592da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42602da392ccSBarry Smith [ ] [ ] [ ] 4261170fe5c8SBarry Smith 4262170fe5c8SBarry Smith */ 4263d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4264d71ae5a4SJacob Faibussowitsch { 4265170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4266170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4267170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 426886214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4269170fe5c8SBarry Smith const PetscInt *ii, *idx; 4270170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4271170fe5c8SBarry Smith PetscScalar *c, *c_q; 427286214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 427386214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4274170fe5c8SBarry Smith 4275170fe5c8SBarry Smith PetscFunctionBegin; 4276d0f46423SBarry Smith m = A->rmap->n; 4277d0f46423SBarry Smith n = A->cmap->n; 4278d0f46423SBarry Smith p = B->cmap->n; 4279170fe5c8SBarry Smith a = sub_a->v; 4280170fe5c8SBarry Smith b = sub_b->a; 4281170fe5c8SBarry Smith c = sub_c->v; 428286214ceeSStefano Zampini if (clda == m) { 42839566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 428486214ceeSStefano Zampini } else { 428586214ceeSStefano Zampini for (j = 0; j < p; j++) 42869371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 428786214ceeSStefano Zampini } 4288170fe5c8SBarry Smith ii = sub_b->i; 4289170fe5c8SBarry Smith idx = sub_b->j; 4290170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4291170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4292170fe5c8SBarry Smith while (q-- > 0) { 429386214ceeSStefano Zampini c_q = c + clda * (*idx); 429486214ceeSStefano Zampini a_q = a + alda * i; 4295854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4296170fe5c8SBarry Smith idx++; 4297170fe5c8SBarry Smith b++; 4298170fe5c8SBarry Smith } 4299170fe5c8SBarry Smith } 43003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4301170fe5c8SBarry Smith } 4302170fe5c8SBarry Smith 4303d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4304d71ae5a4SJacob Faibussowitsch { 4305d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 430686214ceeSStefano Zampini PetscBool cisdense; 4307170fe5c8SBarry Smith 4308170fe5c8SBarry Smith PetscFunctionBegin; 430908401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43109566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43119566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4312d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 431348a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43149566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4315d73949e8SHong Zhang 43164222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4318170fe5c8SBarry Smith } 4319170fe5c8SBarry Smith 43200bad9183SKris Buschelman /*MC 4321fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43220bad9183SKris Buschelman based on compressed sparse row format. 43230bad9183SKris Buschelman 43242ef1f0ffSBarry Smith Options Database Key: 43250bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43260bad9183SKris Buschelman 43270bad9183SKris Buschelman Level: beginner 43280bad9183SKris Buschelman 43290cd7f59aSBarry Smith Notes: 43302ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43310cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43320cd7f59aSBarry Smith in the matrix 43330cd7f59aSBarry Smith 433411a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
    In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
   enough exist.
4360ccd284c7SBarry Smith 43611cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4362ccd284c7SBarry Smith M*/ 4363ccd284c7SBarry Smith 4364ccd284c7SBarry Smith /*MC 4365ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4366ccd284c7SBarry Smith 43672ef1f0ffSBarry Smith Options Database Key: 43682ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43692ef1f0ffSBarry Smith 43702ef1f0ffSBarry Smith Level: beginner 43712ef1f0ffSBarry Smith 43722ef1f0ffSBarry Smith Note: 437311a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 437411a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 437511a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4376ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4377ccd284c7SBarry Smith the above preallocation routines for simplicity. 4378ccd284c7SBarry Smith 43791cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4380ccd284c7SBarry Smith M*/ 4381ccd284c7SBarry Smith 43827906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43837906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43847906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43857906f579SHong Zhang #endif 4386d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4387d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4388d24d4204SJose E. 
Roman #endif 43897906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43907906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43917906f579SHong Zhang #endif 43927906f579SHong Zhang 4393d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4394c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43954222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43967906f579SHong Zhang 43978c778c55SBarry Smith /*@C 439811a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43998c778c55SBarry Smith 44008c778c55SBarry Smith Not Collective 44018c778c55SBarry Smith 44028c778c55SBarry Smith Input Parameter: 4403fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44048c778c55SBarry Smith 44058c778c55SBarry Smith Output Parameter: 44068c778c55SBarry Smith . 
array - pointer to the data 44078c778c55SBarry Smith 44088c778c55SBarry Smith Level: intermediate 44098c778c55SBarry Smith 4410fe59aa6dSJacob Faibussowitsch Fortran Notes: 44110ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44120ab4885dSBarry Smith 44131cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44148c778c55SBarry Smith @*/ 4415d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4416d71ae5a4SJacob Faibussowitsch { 4417d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44188c778c55SBarry Smith 44198c778c55SBarry Smith PetscFunctionBegin; 4420d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44219566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4422d67d9f35SJunchao Zhang } else { 4423d67d9f35SJunchao Zhang *array = aij->a; 4424d67d9f35SJunchao Zhang } 44253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4426d67d9f35SJunchao Zhang } 4427d67d9f35SJunchao Zhang 4428d67d9f35SJunchao Zhang /*@C 442911a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4430d67d9f35SJunchao Zhang 4431d67d9f35SJunchao Zhang Not Collective 4432d67d9f35SJunchao Zhang 4433d67d9f35SJunchao Zhang Input Parameters: 4434fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4435d67d9f35SJunchao Zhang - array - pointer to the data 4436d67d9f35SJunchao Zhang 4437d67d9f35SJunchao Zhang Level: intermediate 4438d67d9f35SJunchao Zhang 4439fe59aa6dSJacob Faibussowitsch Fortran Notes: 44400ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44410ab4885dSBarry Smith 44421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4443d67d9f35SJunchao Zhang 
@*/ 4444d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4445d71ae5a4SJacob Faibussowitsch { 4446d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4447d67d9f35SJunchao Zhang 4448d67d9f35SJunchao Zhang PetscFunctionBegin; 4449d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44509566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4451d67d9f35SJunchao Zhang } else { 4452d67d9f35SJunchao Zhang *array = NULL; 4453d67d9f35SJunchao Zhang } 44549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44559566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44578c778c55SBarry Smith } 44588c778c55SBarry Smith 445921e72a00SBarry Smith /*@C 446011a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44618f1ea47aSStefano Zampini 44620ab4885dSBarry Smith Not Collective; No Fortran Support 44638f1ea47aSStefano Zampini 44648f1ea47aSStefano Zampini Input Parameter: 4465fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44668f1ea47aSStefano Zampini 44678f1ea47aSStefano Zampini Output Parameter: 44688f1ea47aSStefano Zampini . 
array - pointer to the data 44698f1ea47aSStefano Zampini 44708f1ea47aSStefano Zampini Level: intermediate 44718f1ea47aSStefano Zampini 44721cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44738f1ea47aSStefano Zampini @*/ 4474d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4475d71ae5a4SJacob Faibussowitsch { 4476d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44778f1ea47aSStefano Zampini 44788f1ea47aSStefano Zampini PetscFunctionBegin; 4479d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44809566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4481d67d9f35SJunchao Zhang } else { 4482d67d9f35SJunchao Zhang *array = aij->a; 4483d67d9f35SJunchao Zhang } 44843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44858f1ea47aSStefano Zampini } 44868f1ea47aSStefano Zampini 44878f1ea47aSStefano Zampini /*@C 448811a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44898f1ea47aSStefano Zampini 44900ab4885dSBarry Smith Not Collective; No Fortran Support 44918f1ea47aSStefano Zampini 44928f1ea47aSStefano Zampini Input Parameter: 4493fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44948f1ea47aSStefano Zampini 44958f1ea47aSStefano Zampini Output Parameter: 44968f1ea47aSStefano Zampini . 
array - pointer to the data 44978f1ea47aSStefano Zampini 44988f1ea47aSStefano Zampini Level: intermediate 44998f1ea47aSStefano Zampini 45001cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45018f1ea47aSStefano Zampini @*/ 4502d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4503d71ae5a4SJacob Faibussowitsch { 4504d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 45058f1ea47aSStefano Zampini 45068f1ea47aSStefano Zampini PetscFunctionBegin; 4507d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45089566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4509d67d9f35SJunchao Zhang } else { 4510d67d9f35SJunchao Zhang *array = NULL; 4511d67d9f35SJunchao Zhang } 45123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4513d67d9f35SJunchao Zhang } 4514d67d9f35SJunchao Zhang 4515d67d9f35SJunchao Zhang /*@C 451611a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4517d67d9f35SJunchao Zhang 45180ab4885dSBarry Smith Not Collective; No Fortran Support 4519d67d9f35SJunchao Zhang 4520d67d9f35SJunchao Zhang Input Parameter: 4521fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4522d67d9f35SJunchao Zhang 4523d67d9f35SJunchao Zhang Output Parameter: 4524d67d9f35SJunchao Zhang . 
array - pointer to the data 4525d67d9f35SJunchao Zhang 4526d67d9f35SJunchao Zhang Level: intermediate 4527d67d9f35SJunchao Zhang 45281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4529d67d9f35SJunchao Zhang @*/ 4530d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4531d71ae5a4SJacob Faibussowitsch { 4532d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4533d67d9f35SJunchao Zhang 4534d67d9f35SJunchao Zhang PetscFunctionBegin; 4535d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45369566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4537d67d9f35SJunchao Zhang } else { 4538d67d9f35SJunchao Zhang *array = aij->a; 4539d67d9f35SJunchao Zhang } 45409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45419566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4543d67d9f35SJunchao Zhang } 4544d67d9f35SJunchao Zhang 4545d67d9f35SJunchao Zhang /*@C 4546d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4547d67d9f35SJunchao Zhang 45480ab4885dSBarry Smith Not Collective; No Fortran Support 4549d67d9f35SJunchao Zhang 4550d67d9f35SJunchao Zhang Input Parameter: 4551fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4552d67d9f35SJunchao Zhang 4553d67d9f35SJunchao Zhang Output Parameter: 4554d67d9f35SJunchao Zhang . 
array - pointer to the data 4555d67d9f35SJunchao Zhang 4556d67d9f35SJunchao Zhang Level: intermediate 4557d67d9f35SJunchao Zhang 45581cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4559d67d9f35SJunchao Zhang @*/ 4560d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4561d71ae5a4SJacob Faibussowitsch { 4562d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4563d67d9f35SJunchao Zhang 4564d67d9f35SJunchao Zhang PetscFunctionBegin; 4565d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45669566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4567d67d9f35SJunchao Zhang } else { 4568d67d9f35SJunchao Zhang *array = NULL; 4569d67d9f35SJunchao Zhang } 45703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45718f1ea47aSStefano Zampini } 45728f1ea47aSStefano Zampini 45738f1ea47aSStefano Zampini /*@C 457411a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45757ee59b9bSJunchao Zhang 45760ab4885dSBarry Smith Not Collective; No Fortran Support 45777ee59b9bSJunchao Zhang 45787ee59b9bSJunchao Zhang Input Parameter: 457911a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45807ee59b9bSJunchao Zhang 45817ee59b9bSJunchao Zhang Output Parameters: 45827ee59b9bSJunchao Zhang + i - row map array of the matrix 45837ee59b9bSJunchao Zhang . j - column index array of the matrix 45847ee59b9bSJunchao Zhang . a - data array of the matrix 4585fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45867ee59b9bSJunchao Zhang 4587fe59aa6dSJacob Faibussowitsch Level: developer 45882ef1f0ffSBarry Smith 45897ee59b9bSJunchao Zhang Notes: 45902ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45917ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45927ee59b9bSJunchao Zhang 45937ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45942ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45957ee59b9bSJunchao Zhang 45961cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45977ee59b9bSJunchao Zhang @*/ 4598d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4599d71ae5a4SJacob Faibussowitsch { 46007ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 46017ee59b9bSJunchao Zhang 46027ee59b9bSJunchao Zhang PetscFunctionBegin; 46037ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 46047ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46057ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 46067ee59b9bSJunchao Zhang } else { 46077ee59b9bSJunchao Zhang if (i) *i = aij->i; 46087ee59b9bSJunchao Zhang if (j) *j = aij->j; 46097ee59b9bSJunchao Zhang if (a) *a = aij->a; 46107ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46117ee59b9bSJunchao Zhang } 46123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46137ee59b9bSJunchao Zhang } 46147ee59b9bSJunchao Zhang 46157ee59b9bSJunchao Zhang /*@C 461621e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 461721e72a00SBarry Smith 461821e72a00SBarry Smith Not Collective 461921e72a00SBarry Smith 462021e72a00SBarry Smith Input Parameter: 4621fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 462221e72a00SBarry Smith 462321e72a00SBarry Smith Output Parameter: 462421e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 462521e72a00SBarry Smith 462621e72a00SBarry Smith Level: intermediate 462721e72a00SBarry Smith 46281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 462921e72a00SBarry Smith @*/ 4630d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4631d71ae5a4SJacob Faibussowitsch { 463221e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 463321e72a00SBarry Smith 463421e72a00SBarry Smith PetscFunctionBegin; 463521e72a00SBarry Smith *nz = aij->rmax; 46363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 463721e72a00SBarry Smith } 463821e72a00SBarry Smith 46392c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data) 46402c4ab24aSJunchao Zhang { 46412c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data; 46424d86920dSPierre Jolivet 46432c4ab24aSJunchao Zhang PetscFunctionBegin; 46442c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46452c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46462c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46472c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46482c4ab24aSJunchao Zhang } 46492c4ab24aSJunchao Zhang 4650d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4651d71ae5a4SJacob Faibussowitsch { 4652394ed5ebSJunchao Zhang MPI_Comm comm; 4653394ed5ebSJunchao Zhang PetscInt *i, *j; 46540d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4655394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4656394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4657394ed5ebSJunchao Zhang PetscInt *Aj; 4658394ed5ebSJunchao Zhang PetscScalar *Aa; 4659f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 
4660cbc6b225SStefano Zampini MatType rtype; 4661394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46622c4ab24aSJunchao Zhang PetscContainer container; 46632c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46640d88f7f4SJunchao Zhang PetscBool isorted; 4665394ed5ebSJunchao Zhang 4666394ed5ebSJunchao Zhang PetscFunctionBegin; 46679566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46689566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4669e8729f6fSJunchao Zhang i = coo_i; 4670e8729f6fSJunchao Zhang j = coo_j; 46719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46720d88f7f4SJunchao Zhang 46730d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46740d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46750d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46760d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4677394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46780d88f7f4SJunchao Zhang if (isorted) { 46790d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46800d88f7f4SJunchao Zhang else iprev = i[k]; 46810d88f7f4SJunchao Zhang } 4682394ed5ebSJunchao Zhang perm[k] = k; 4683394ed5ebSJunchao Zhang } 4684394ed5ebSJunchao Zhang 46850d88f7f4SJunchao Zhang /* Sort by row if not already */ 46860d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4687651b1cf9SStefano Zampini 4688651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4689651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46909371c9d4SSatish Balay if (i[k] >= 0) break; 4691394ed5ebSJunchao Zhang nneg = k; 46929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4693394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 469435cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4695394ed5ebSJunchao Zhang 46969566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4698394ed5ebSJunchao Zhang 4699651b1cf9SStefano Zampini /* Support for HYPRE */ 4700651b1cf9SStefano Zampini PetscBool hypre; 4701651b1cf9SStefano Zampini const char *name; 4702651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4703651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4704651b1cf9SStefano Zampini 4705394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 470635cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4707394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4708394ed5ebSJunchao Zhang while (k < coo_n) { 47090d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 
47100d88f7f4SJunchao Zhang PetscInt jprev; 47110d88f7f4SJunchao Zhang 47120d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4713394ed5ebSJunchao Zhang row = i[k]; 47140d88f7f4SJunchao Zhang start = k; 47150d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 47160d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 47170d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47180d88f7f4SJunchao Zhang if (strictly_sorted) { 47190d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47200d88f7f4SJunchao Zhang else jprev = j[k]; 47210d88f7f4SJunchao Zhang } 47220d88f7f4SJunchao Zhang k++; 47230d88f7f4SJunchao Zhang } 4724394ed5ebSJunchao Zhang end = k; 47250d88f7f4SJunchao Zhang 4726651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4727651b1cf9SStefano Zampini if (hypre) { 4728651b1cf9SStefano Zampini PetscInt minj = PETSC_MAX_INT; 4729651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47300d88f7f4SJunchao Zhang 47310d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47320d88f7f4SJunchao Zhang PetscCount tmp; 47330d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47340d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 47350d88f7f4SJunchao Zhang j[p] = j[start]; 47360d88f7f4SJunchao Zhang j[start] = row; 47370d88f7f4SJunchao Zhang tmp = perm[start]; 47380d88f7f4SJunchao Zhang perm[start] = perm[p]; 47390d88f7f4SJunchao Zhang perm[p] = tmp; 47400d88f7f4SJunchao Zhang break; 47410d88f7f4SJunchao Zhang } 47420d88f7f4SJunchao Zhang } 47430d88f7f4SJunchao Zhang } else { 4744651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4745651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4746651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4747651b1cf9SStefano Zampini } 47480d88f7f4SJunchao Zhang 4749651b1cf9SStefano Zampini if (hasdiag) { 4750651b1cf9SStefano 
Zampini for (p = start; p < end; p++) { 4751651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4752651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4753651b1cf9SStefano Zampini } 4754651b1cf9SStefano Zampini } 4755651b1cf9SStefano Zampini } 47560d88f7f4SJunchao Zhang } 47570d88f7f4SJunchao Zhang // sort by columns in a row 47580d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4759651b1cf9SStefano Zampini 47600d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47610d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47620d88f7f4SJunchao Zhang Aj[q] = j[p]; 47630d88f7f4SJunchao Zhang jmap[q] = 1; 47640d88f7f4SJunchao Zhang } 47650d88f7f4SJunchao Zhang Ai[row] = end - start; 47660d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47670d88f7f4SJunchao Zhang } else { 4768394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4769394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4770651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4771394ed5ebSJunchao Zhang Ai[row] = 1; 4772394ed5ebSJunchao Zhang nnz++; 4773394ed5ebSJunchao Zhang 4774394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4775394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4776394ed5ebSJunchao Zhang q++; 4777394ed5ebSJunchao Zhang jmap[q] = 1; 4778394ed5ebSJunchao Zhang Aj[q] = j[p]; 4779394ed5ebSJunchao Zhang Ai[row]++; 4780394ed5ebSJunchao Zhang nnz++; 4781394ed5ebSJunchao Zhang } else { 4782394ed5ebSJunchao Zhang jmap[q]++; 4783394ed5ebSJunchao Zhang } 4784394ed5ebSJunchao Zhang } 4785394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4786394ed5ebSJunchao Zhang } 47870d88f7f4SJunchao Zhang } 47880d88f7f4SJunchao Zhang 4789394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of 
Ai[] */ 4790394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 47910d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4792394ed5ebSJunchao Zhang jmap[0] = 0; 4793394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47940d88f7f4SJunchao Zhang 4795394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4796394ed5ebSJunchao Zhang PetscCount *jmap_new; 4797394ed5ebSJunchao Zhang PetscInt *Aj_new; 4798394ed5ebSJunchao Zhang 47999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 48009566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 48019566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4802394ed5ebSJunchao Zhang jmap = jmap_new; 4803394ed5ebSJunchao Zhang 48049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 48059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 48069566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4807394ed5ebSJunchao Zhang Aj = Aj_new; 4808394ed5ebSJunchao Zhang } 4809394ed5ebSJunchao Zhang 4810394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4811394ed5ebSJunchao Zhang PetscCount *perm_new; 4812cbc6b225SStefano Zampini 48139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 48149566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 48159566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4816394ed5ebSJunchao Zhang perm = perm_new; 4817394ed5ebSJunchao Zhang } 4818394ed5ebSJunchao Zhang 48199566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48209566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 48219566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 
4822394ed5ebSJunchao Zhang 4823394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4824394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48252c4ab24aSJunchao Zhang 48262c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48272c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48282c4ab24aSJunchao Zhang coo->nz = nnz; 48292c4ab24aSJunchao Zhang coo->n = coo_n; 48302c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48312c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48322c4ab24aSJunchao Zhang coo->perm = perm; 48332c4ab24aSJunchao Zhang PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container)); 48342c4ab24aSJunchao Zhang PetscCall(PetscContainerSetPointer(container, coo)); 48352c4ab24aSJunchao Zhang PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ)); 48362c4ab24aSJunchao Zhang PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container)); 48372c4ab24aSJunchao Zhang PetscCall(PetscContainerDestroy(&container)); 48383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4839394ed5ebSJunchao Zhang } 4840394ed5ebSJunchao Zhang 4841d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4842d71ae5a4SJacob Faibussowitsch { 4843394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4844394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48452c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4846394ed5ebSJunchao Zhang PetscScalar *Aa; 48472c4ab24aSJunchao Zhang PetscContainer container; 48482c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4849394ed5ebSJunchao Zhang 4850394ed5ebSJunchao Zhang PetscFunctionBegin; 48512c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, 
"__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48522c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48532c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48542c4ab24aSJunchao Zhang perm = coo->perm; 48552c4ab24aSJunchao Zhang jmap = coo->jmap; 48569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4857394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4858b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4859b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4860b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4861394ed5ebSJunchao Zhang } 48629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4864394ed5ebSJunchao Zhang } 4865394ed5ebSJunchao Zhang 486634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48675063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 486802fe1965SBarry Smith #endif 4869d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4870d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4871d5e393b6SSuyash Tandon #endif 48723d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48735063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48743d0639e7SStefano Zampini #endif 487502fe1965SBarry Smith 4876d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4877d71ae5a4SJacob Faibussowitsch { 4878273d9f13SBarry Smith Mat_SeqAIJ *b; 487938baddfdSBarry Smith PetscMPIInt size; 4880273d9f13SBarry Smith 4881273d9f13SBarry Smith PetscFunctionBegin; 48829566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 
488308401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4884273d9f13SBarry Smith 48854dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48862205254eSKarl Rupp 4887b0a32e0cSBarry Smith B->data = (void *)b; 4888aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4889071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48902205254eSKarl Rupp 4891f4259b30SLisandro Dalcin b->row = NULL; 4892f4259b30SLisandro Dalcin b->col = NULL; 4893f4259b30SLisandro Dalcin b->icol = NULL; 4894b810aeb4SBarry Smith b->reallocs = 0; 489536db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4896f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4897416022c9SBarry Smith b->nonew = 0; 4898f4259b30SLisandro Dalcin b->diag = NULL; 4899f4259b30SLisandro Dalcin b->solve_work = NULL; 4900f4259b30SLisandro Dalcin B->spptr = NULL; 4901f4259b30SLisandro Dalcin b->saved_values = NULL; 4902f4259b30SLisandro Dalcin b->idiag = NULL; 4903f4259b30SLisandro Dalcin b->mdiag = NULL; 4904f4259b30SLisandro Dalcin b->ssor_work = NULL; 490571f1c65dSBarry Smith b->omega = 1.0; 490671f1c65dSBarry Smith b->fshift = 0.0; 490771f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4908bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4909a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 491017ab2063SBarry Smith 49119566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4912d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 49139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 49149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4915b3866ffcSBarry Smith #endif 49169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", 
MatSeqAIJSetColumnIndices_SeqAIJ)); 49179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49239779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49249566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4925191b95cbSRichard Tran Mills #endif 492634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49289566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 493002fe1965SBarry Smith #endif 4931d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4932d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4933d5e393b6SSuyash Tandon 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4934d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4935d5e393b6SSuyash Tandon #endif 49363d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49383d0639e7SStefano Zampini #endif 49399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4940af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4942af8000cdSHong Zhang #endif 4943d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4945d24d4204SJose E. 
Roman #endif 494663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 494963c07aadSStefano Zampini #endif 49509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 495414e4dea2SJose E. 
Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 49579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49659566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49669566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49683ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 496917ab2063SBarry Smith } 497017ab2063SBarry Smith 4971b24902e0SBarry Smith /* 49723893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4973b24902e0SBarry Smith */ 4974d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4975d71ae5a4SJacob Faibussowitsch { 49762a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4977071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 497817ab2063SBarry Smith 49793a40ed3dSBarry Smith PetscFunctionBegin; 4980aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4981273d9f13SBarry Smith 4982d5f3da31SBarry Smith C->factortype = A->factortype; 4983f4259b30SLisandro Dalcin c->row = NULL; 4984f4259b30SLisandro Dalcin c->col = NULL; 4985f4259b30SLisandro Dalcin c->icol = NULL; 49866ad4291fSHong Zhang c->reallocs = 0; 4987bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 498817ab2063SBarry Smith 498969272f91SPierre Jolivet C->assembled = A->assembled; 499017ab2063SBarry Smith 499169272f91SPierre Jolivet if (A->preallocated) { 49929566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49939566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4994eec197d1SBarry Smith 499531fe6a7dSBarry Smith if (!A->hash_active) { 49969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49999566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 500017ab2063SBarry Smith 500117ab2063SBarry Smith /* allocate the matrix space */ 
5002f77e22a1SHong Zhang if (mallocmatspace) { 50039566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 50042205254eSKarl Rupp 5005f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 50062205254eSKarl Rupp 50079566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 500817ab2063SBarry Smith if (m > 0) { 50099566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 5010be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 50112e5835c6SStefano Zampini const PetscScalar *aa; 50122e5835c6SStefano Zampini 50139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50149566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5016be6bf707SBarry Smith } else { 50179566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 501817ab2063SBarry Smith } 501908480c60SBarry Smith } 5020f77e22a1SHong Zhang } 502131fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 502231fe6a7dSBarry Smith } else { 502331fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 502431fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 502531fe6a7dSBarry Smith } 502617ab2063SBarry Smith 50276ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5028416022c9SBarry Smith c->roworiented = a->roworiented; 5029416022c9SBarry Smith c->nonew = a->nonew; 5030416022c9SBarry Smith if (a->diag) { 50319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 50329566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5033071fcb05SBarry Smith } else c->diag = NULL; 50342205254eSKarl Rupp 5035f4259b30SLisandro Dalcin c->solve_work = NULL; 5036f4259b30SLisandro Dalcin c->saved_values = NULL; 5037f4259b30SLisandro Dalcin c->idiag = NULL; 
5038f4259b30SLisandro Dalcin c->ssor_work = NULL; 5039a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 5040e6b907acSBarry Smith c->free_a = PETSC_TRUE; 5041e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 50426ad4291fSHong Zhang 5043893ad86cSHong Zhang c->rmax = a->rmax; 5044416022c9SBarry Smith c->nz = a->nz; 50458ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5046754ec7b1SSatish Balay 50476ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50486ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5049cd6b891eSBarry Smith if (a->compressedrow.use) { 50506ad4291fSHong Zhang i = a->compressedrow.nrows; 50519566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50529566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50539566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 505427ea64f8SHong Zhang } else { 505527ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50560298fd71SBarry Smith c->compressedrow.i = NULL; 50570298fd71SBarry Smith c->compressedrow.rindex = NULL; 50586ad4291fSHong Zhang } 5059ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5060e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50614846f1f5SKris Buschelman 50629566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 506369272f91SPierre Jolivet } 50649566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 506617ab2063SBarry Smith } 506717ab2063SBarry Smith 5068d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5069d71ae5a4SJacob Faibussowitsch { 5070b24902e0SBarry Smith PetscFunctionBegin; 50719566063dSJacob 
Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50729566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 507348a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50749566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50759566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5077b24902e0SBarry Smith } 5078b24902e0SBarry Smith 5079d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5080d71ae5a4SJacob Faibussowitsch { 508152f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 508252f91c60SVaclav Hapla 508352f91c60SVaclav Hapla PetscFunctionBegin; 508452f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 508552f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5086c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50879566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50899566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 509052f91c60SVaclav Hapla if (isbinary) { 50919566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 509252f91c60SVaclav Hapla } else if (ishdf5) { 509352f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50949566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 509552f91c60SVaclav Hapla #else 509652f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 509752f91c60SVaclav Hapla #endif 
509852f91c60SVaclav Hapla } else { 509998921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 510052f91c60SVaclav Hapla } 51013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 510252f91c60SVaclav Hapla } 510352f91c60SVaclav Hapla 5104d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5105d71ae5a4SJacob Faibussowitsch { 51063ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 51073ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5108fbdbba38SShri Abhyankar 5109fbdbba38SShri Abhyankar PetscFunctionBegin; 51109566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5111bbead8a2SBarry Smith 51123ea6fe3dSLisandro Dalcin /* read in matrix header */ 51139566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 511408401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 51159371c9d4SSatish Balay M = header[1]; 51169371c9d4SSatish Balay N = header[2]; 51179371c9d4SSatish Balay nz = header[3]; 511808401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 511908401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 512008401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5121fbdbba38SShri Abhyankar 51223ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 51239566063dSJacob Faibussowitsch 
PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51243ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51253ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51263ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51273ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51283ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51299566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51313ea6fe3dSLisandro Dalcin 51323ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51339566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5134aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51353ea6fe3dSLisandro Dalcin 5136fbdbba38SShri Abhyankar /* read in row lengths */ 51379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51389566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51393ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51409371c9d4SSatish Balay sum = 0; 51419371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 514208401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51433ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51459566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5146aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of 
different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51473ea6fe3dSLisandro Dalcin /* store row lengths */ 51489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51499566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5150fbdbba38SShri Abhyankar 51513ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51529371c9d4SSatish Balay a->i[0] = 0; 51539371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51543ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51559566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51563ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51579566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5158fbdbba38SShri Abhyankar 51599566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51609566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5162fbdbba38SShri Abhyankar } 5163fbdbba38SShri Abhyankar 5164d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5165d71ae5a4SJacob Faibussowitsch { 51667264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5167fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5168eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5169eeffb40dSHong Zhang PetscInt k; 5170eeffb40dSHong Zhang #endif 51717264ac53SSatish Balay 51723a40ed3dSBarry Smith PetscFunctionBegin; 5173bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5174d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5175ca44d042SBarry Smith *flg = PETSC_FALSE; 51763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
5177bcd2baecSBarry Smith } 51787264ac53SSatish Balay 51797264ac53SSatish Balay /* if the a->i are the same */ 51809566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51813ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51827264ac53SSatish Balay 51837264ac53SSatish Balay /* if a->j are the same */ 51849566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51853ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5186bcd2baecSBarry Smith 51879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5189bcd2baecSBarry Smith /* if a->a are the same */ 5190eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5191eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5192fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5193eeffb40dSHong Zhang *flg = PETSC_FALSE; 51943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5195eeffb40dSHong Zhang } 5196eeffb40dSHong Zhang } 5197eeffb40dSHong Zhang #else 51989566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5199eeffb40dSHong Zhang #endif 52009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 52019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 52023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52037264ac53SSatish Balay } 520436db0b34SBarry Smith 520505869f15SSatish Balay /*@ 520611a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 520736db0b34SBarry Smith provided by the user. 
520836db0b34SBarry Smith 5209d083f849SBarry Smith Collective 521036db0b34SBarry Smith 521136db0b34SBarry Smith Input Parameters: 521236db0b34SBarry Smith + comm - must be an MPI communicator of size 1 521336db0b34SBarry Smith . m - number of rows 521436db0b34SBarry Smith . n - number of columns 5215483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 521636db0b34SBarry Smith . j - column indices 521736db0b34SBarry Smith - a - matrix values 521836db0b34SBarry Smith 521936db0b34SBarry Smith Output Parameter: 522036db0b34SBarry Smith . mat - the matrix 522136db0b34SBarry Smith 522236db0b34SBarry Smith Level: intermediate 522336db0b34SBarry Smith 522436db0b34SBarry Smith Notes: 52252ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5226292fb18eSBarry Smith once the matrix is destroyed and not before 522736db0b34SBarry Smith 522836db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 522936db0b34SBarry Smith 52302ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 523136db0b34SBarry Smith 5232a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5233a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 52348eef79e4SBarry Smith as shown 52352ef1f0ffSBarry Smith .vb 52362ef1f0ffSBarry Smith 1 0 0 52372ef1f0ffSBarry Smith 2 0 3 52382ef1f0ffSBarry Smith 4 5 6 5239a4552177SSatish Balay 52402ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52412ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52422ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52432ef1f0ffSBarry Smith .ve 5244a4552177SSatish Balay 52451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 524636db0b34SBarry Smith @*/ 5247d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5248d71ae5a4SJacob Faibussowitsch { 5249cbcfb4deSHong Zhang PetscInt ii; 525036db0b34SBarry Smith Mat_SeqAIJ *aij; 5251cbcfb4deSHong Zhang PetscInt jj; 525236db0b34SBarry Smith 525336db0b34SBarry Smith PetscFunctionBegin; 5254aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52559566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52569566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52579566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52589566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5260ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5263ab93d7beSBarry Smith 526436db0b34SBarry Smith aij->i = i; 526536db0b34SBarry Smith aij->j = j; 526636db0b34SBarry Smith aij->a = a; 
526736db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 526836db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5269e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5270e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 527136db0b34SBarry Smith 5272cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 527336db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 527476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5275aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52769985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 527708401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 527808401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52799985e31cSBarry Smith } 528036db0b34SBarry Smith } 528176bd3646SJed Brown } 528276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 528336db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 528408401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5285da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 528636db0b34SBarry Smith } 528776bd3646SJed 
Brown } 528836db0b34SBarry Smith 52899566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52909566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 529236db0b34SBarry Smith } 5293cbc6b225SStefano Zampini 5294f62e3866SBarry Smith /*@ 529511a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52968a0b0e6bSVictor Minden provided by the user. 52978a0b0e6bSVictor Minden 5298d083f849SBarry Smith Collective 52998a0b0e6bSVictor Minden 53008a0b0e6bSVictor Minden Input Parameters: 53018a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 53028a0b0e6bSVictor Minden . m - number of rows 53038a0b0e6bSVictor Minden . n - number of columns 53048a0b0e6bSVictor Minden . i - row indices 53058a0b0e6bSVictor Minden . j - column indices 53061230e6d1SVictor Minden . a - matrix values 53071230e6d1SVictor Minden . nz - number of nonzeros 53082ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 53098a0b0e6bSVictor Minden 53108a0b0e6bSVictor Minden Output Parameter: 53118a0b0e6bSVictor Minden . 
mat - the matrix 53128a0b0e6bSVictor Minden 53138a0b0e6bSVictor Minden Level: intermediate 53148a0b0e6bSVictor Minden 5315f62e3866SBarry Smith Example: 5316f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 53179e99939fSJunchao Zhang .vb 53188a0b0e6bSVictor Minden 1 0 0 53198a0b0e6bSVictor Minden 2 0 3 53208a0b0e6bSVictor Minden 4 5 6 53218a0b0e6bSVictor Minden 53228a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53238a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53248a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53259e99939fSJunchao Zhang .ve 5326fe59aa6dSJacob Faibussowitsch 53272ef1f0ffSBarry Smith Note: 5328d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5329d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53308a0b0e6bSVictor Minden 53311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53328a0b0e6bSVictor Minden @*/ 5333d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5334d71ae5a4SJacob Faibussowitsch { 5335d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53368a0b0e6bSVictor Minden 53378a0b0e6bSVictor Minden PetscFunctionBegin; 53389566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5339ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53409566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53419566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53429566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53439566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53441230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53451230e6d1SVictor Minden if (idx) { 53461230e6d1SVictor Minden row = i[ii] - 1; 53471230e6d1SVictor Minden col = j[ii] - 1; 53481230e6d1SVictor Minden } else { 53491230e6d1SVictor Minden row = i[ii]; 53501230e6d1SVictor Minden col = j[ii]; 53518a0b0e6bSVictor Minden } 53529566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53538a0b0e6bSVictor Minden } 53549566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53569566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53588a0b0e6bSVictor Minden } 535936db0b34SBarry Smith 5360d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5361d71ae5a4SJacob Faibussowitsch { 5362acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5363acf2f550SJed Brown 5364acf2f550SJed Brown PetscFunctionBegin; 5365acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5366acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53672205254eSKarl Rupp 53689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5370acf2f550SJed Brown } 5371acf2f550SJed Brown 5372d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5373d71ae5a4SJacob Faibussowitsch { 53749c8f2541SHong Zhang PetscFunctionBegin; 53759566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53779c8f2541SHong Zhang } 53789c8f2541SHong Zhang 537981824310SBarry Smith /* 538053dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 538153dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 538253dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 538353dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 538453dd7562SDmitry Karpeev */ 5385d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5386d71ae5a4SJacob Faibussowitsch { 538753dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 538853dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 538953dd7562SDmitry Karpeev PetscBool seqaij; 539053dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 539153dd7562SDmitry Karpeev PetscScalar v; 539253dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 539353dd7562SDmitry Karpeev 539453dd7562SDmitry Karpeev PetscFunctionBegin; 53953ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 539653dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53979566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 539828b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 539953dd7562SDmitry Karpeev if (rowemb) { 54009566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 540108401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 540253dd7562SDmitry Karpeev } else { 540308401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 540453dd7562SDmitry Karpeev } 540553dd7562SDmitry Karpeev if (colemb) { 54069566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 540708401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 540853dd7562SDmitry Karpeev } else { 540908401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 541053dd7562SDmitry Karpeev } 541153dd7562SDmitry Karpeev 5412f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 541353dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 54149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5415ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 54169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 54179566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 541853dd7562SDmitry Karpeev } 541948a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 542053dd7562SDmitry Karpeev count = 0; 542153dd7562SDmitry Karpeev rowindices = NULL; 
542253dd7562SDmitry Karpeev colindices = NULL; 542348a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 542448a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 542553dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 542653dd7562SDmitry Karpeev PetscInt row; 542753dd7562SDmitry Karpeev row = i; 542853dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 542953dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 543053dd7562SDmitry Karpeev PetscInt col; 543153dd7562SDmitry Karpeev col = Baij->j[count]; 543253dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 543353dd7562SDmitry Karpeev v = Baij->a[count]; 54349566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 543553dd7562SDmitry Karpeev ++count; 543653dd7562SDmitry Karpeev } 543753dd7562SDmitry Karpeev } 543853dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 543953dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 544053dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 544153dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 544253dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 544453dd7562SDmitry Karpeev } 544553dd7562SDmitry Karpeev 544658c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5447dec0b466SHong Zhang { 5448dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5449dec0b466SHong Zhang MatScalar *aa = a->a; 5450dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5451dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5452dec0b466SHong Zhang 5453dec0b466SHong Zhang PetscFunctionBegin; 5454dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5455dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5456dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5457dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5458dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 545958c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5460dec0b466SHong Zhang else { 5461dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5462dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5463dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5464dec0b466SHong Zhang } 5465dec0b466SHong Zhang } 5466dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5467dec0b466SHong Zhang fshift_prev = fshift; 5468dec0b466SHong Zhang /* reset ilen and imax for each row */ 5469dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5470dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5471dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5472dec0b466SHong Zhang } 5473312eded4SPierre Jolivet if (fshift) { 5474dec0b466SHong Zhang if (m) { 5475dec0b466SHong Zhang ai[m] -= fshift; 5476dec0b466SHong Zhang a->nz = ai[m]; 5477dec0b466SHong Zhang } 5478dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5479312eded4SPierre Jolivet A->nonzerostate++; 5480dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5481dec0b466SHong Zhang a->rmax = rmax; 5482dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5483dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5484dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5485312eded4SPierre Jolivet } 54863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5487dec0b466SHong Zhang } 5488dec0b466SHong Zhang 54894099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54904099cc6bSBarry Smith 54914099cc6bSBarry Smith /*@C 549211a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54934099cc6bSBarry Smith 5494c3339decSBarry Smith Collective 54954099cc6bSBarry Smith 54964099cc6bSBarry Smith Input Parameters: 54974099cc6bSBarry Smith + mat - the matrix object 54984099cc6bSBarry Smith - matype - matrix type 54994099cc6bSBarry Smith 55004099cc6bSBarry Smith Options Database Key: 55014e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 55024099cc6bSBarry Smith 55034099cc6bSBarry Smith Level: intermediate 55044099cc6bSBarry Smith 5505fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 55064099cc6bSBarry Smith @*/ 5507d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5508d71ae5a4SJacob Faibussowitsch { 55094099cc6bSBarry Smith PetscBool sametype; 55105f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 55114099cc6bSBarry Smith 55124099cc6bSBarry Smith PetscFunctionBegin; 55134099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 55149566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 55153ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 55164099cc6bSBarry Smith 55179566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55186adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55199566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55214099cc6bSBarry Smith } 55224099cc6bSBarry Smith 55234099cc6bSBarry Smith /*@C 552411a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55254099cc6bSBarry Smith 55264099cc6bSBarry Smith Not Collective 55274099cc6bSBarry Smith 55284099cc6bSBarry Smith Input Parameters: 5529fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55304099cc6bSBarry Smith - function - routine to convert to subtype 55314099cc6bSBarry Smith 55322ef1f0ffSBarry Smith Level: advanced 55332ef1f0ffSBarry Smith 55344099cc6bSBarry Smith Notes: 553511a5261eSBarry Smith `MatSeqAIJRegister()` may be 
called multiple times to add several user-defined solvers. 55364099cc6bSBarry Smith 55374099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55384099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55394099cc6bSBarry Smith 55401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55414099cc6bSBarry Smith @*/ 5542d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5543d71ae5a4SJacob Faibussowitsch { 55444099cc6bSBarry Smith PetscFunctionBegin; 55459566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55469566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55484099cc6bSBarry Smith } 55494099cc6bSBarry Smith 55504099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55514099cc6bSBarry Smith 55524099cc6bSBarry Smith /*@C 555311a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55544099cc6bSBarry Smith 55554099cc6bSBarry Smith Not Collective 55564099cc6bSBarry Smith 55574099cc6bSBarry Smith Level: advanced 55584099cc6bSBarry Smith 55592ef1f0ffSBarry Smith Note: 55602ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55612ef1f0ffSBarry Smith 55621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55634099cc6bSBarry Smith @*/ 5564d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5565d71ae5a4SJacob Faibussowitsch { 55664099cc6bSBarry Smith PetscFunctionBegin; 55673ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55684099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55694099cc6bSBarry Smith 55709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, 
MatConvert_SeqAIJ_SeqAIJCRL)); 55719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55739779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5575485f9817SRichard Tran Mills #endif 55765063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55785063d097SStefano Zampini #endif 5579d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5580d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5581d5e393b6SSuyash Tandon #endif 55825063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55845063d097SStefano Zampini #endif 55854099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55874099cc6bSBarry Smith #endif 55883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55894099cc6bSBarry Smith } 559053dd7562SDmitry Karpeev 559153dd7562SDmitry Karpeev /* 559281824310SBarry Smith Special version for direct calls from Fortran 559381824310SBarry Smith */ 5594af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 559581824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 559681824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 559781824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 559881824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 559981824310SBarry Smith #endif 560081824310SBarry Smith 
560181824310SBarry Smith /* Change these macros so can be used in void function */ 560298921bdaSJacob Faibussowitsch 560398921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 56049566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 56059566063dSJacob Faibussowitsch #undef PetscCall 56069371c9d4SSatish Balay #define PetscCall(...) \ 56079371c9d4SSatish Balay do { \ 56085f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 560998921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 561098921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 561198921bdaSJacob Faibussowitsch return; \ 561298921bdaSJacob Faibussowitsch } \ 561398921bdaSJacob Faibussowitsch } while (0) 561498921bdaSJacob Faibussowitsch 561598921bdaSJacob Faibussowitsch #undef SETERRQ 56169371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) 
\ 56179371c9d4SSatish Balay do { \ 561898921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 561998921bdaSJacob Faibussowitsch return; \ 562098921bdaSJacob Faibussowitsch } while (0) 562181824310SBarry Smith 5622d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5623d71ae5a4SJacob Faibussowitsch { 562481824310SBarry Smith Mat A = *AA; 562581824310SBarry Smith PetscInt m = *mm, n = *nn; 562681824310SBarry Smith InsertMode is = *isis; 562781824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 562881824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 562981824310SBarry Smith PetscInt *imax, *ai, *ailen; 563081824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 563154f21887SBarry Smith MatScalar *ap, value, *aa; 5632ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5633ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 563481824310SBarry Smith 563581824310SBarry Smith PetscFunctionBegin; 56364994cf47SJed Brown MatCheckPreallocated(A, 1); 563781824310SBarry Smith imax = a->imax; 563881824310SBarry Smith ai = a->i; 563981824310SBarry Smith ailen = a->ilen; 564081824310SBarry Smith aj = a->j; 564181824310SBarry Smith aa = a->a; 564281824310SBarry Smith 564381824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 564481824310SBarry Smith row = im[k]; 564581824310SBarry Smith if (row < 0) continue; 56465f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56479371c9d4SSatish Balay rp = aj + ai[row]; 56489371c9d4SSatish Balay ap = aa + ai[row]; 56499371c9d4SSatish Balay rmax = imax[row]; 56509371c9d4SSatish Balay nrow = ailen[row]; 565181824310SBarry 
Smith low = 0; 565281824310SBarry Smith high = nrow; 565381824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 565481824310SBarry Smith if (in[l] < 0) continue; 56555f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 565681824310SBarry Smith col = in[l]; 56572205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56582205254eSKarl Rupp else value = v[k + l * m]; 56592205254eSKarl Rupp 566081824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 566181824310SBarry Smith 56622205254eSKarl Rupp if (col <= lastcol) low = 0; 56632205254eSKarl Rupp else high = nrow; 566481824310SBarry Smith lastcol = col; 566581824310SBarry Smith while (high - low > 5) { 566681824310SBarry Smith t = (low + high) / 2; 566781824310SBarry Smith if (rp[t] > col) high = t; 566881824310SBarry Smith else low = t; 566981824310SBarry Smith } 567081824310SBarry Smith for (i = low; i < high; i++) { 567181824310SBarry Smith if (rp[i] > col) break; 567281824310SBarry Smith if (rp[i] == col) { 567381824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 567481824310SBarry Smith else ap[i] = value; 567581824310SBarry Smith goto noinsert; 567681824310SBarry Smith } 567781824310SBarry Smith } 567881824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 567981824310SBarry Smith if (nonew == 1) goto noinsert; 56805f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5681fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56829371c9d4SSatish Balay N = nrow++ - 1; 56839371c9d4SSatish Balay a->nz++; 56849371c9d4SSatish Balay high++; 568581824310SBarry Smith /* shift up all the later entries in this row */ 568681824310SBarry Smith for (ii = N; ii >= i; ii--) { 
568781824310SBarry Smith rp[ii + 1] = rp[ii]; 568881824310SBarry Smith ap[ii + 1] = ap[ii]; 568981824310SBarry Smith } 569081824310SBarry Smith rp[i] = col; 569181824310SBarry Smith ap[i] = value; 5692e56f5c9eSBarry Smith A->nonzerostate++; 569381824310SBarry Smith noinsert:; 569481824310SBarry Smith low = i + 1; 569581824310SBarry Smith } 569681824310SBarry Smith ailen[row] = nrow; 569781824310SBarry Smith } 569881824310SBarry Smith PetscFunctionReturnVoid(); 569981824310SBarry Smith } 570098921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 570198921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 570298921bdaSJacob Faibussowitsch * original definitions */ 57039566063dSJacob Faibussowitsch #undef PetscCall 570498921bdaSJacob Faibussowitsch #undef SETERRQ 5705