1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 418720833daSHong Zhang rp = aj + ai[row]; 419876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 453c2653b3dSLois Curfman McInnes if 
(nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e56f5c9eSBarry Smith A->nonzerostate++; 472e44c0bd4SBarry Smith noinsert:; 47317ab2063SBarry Smith } 47417ab2063SBarry Smith ailen[row] = nrow; 47517ab2063SBarry Smith } 4769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47817ab2063SBarry Smith } 47917ab2063SBarry Smith 480ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 481d71ae5a4SJacob Faibussowitsch { 48219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48319b08ed1SBarry Smith PetscInt *rp, k, row; 48419b08ed1SBarry Smith PetscInt *ai = a->i; 48519b08ed1SBarry Smith PetscInt *aj = a->j; 486fff043a9SJunchao Zhang MatScalar *aa, 
*ap; 48719b08ed1SBarry Smith 48819b08ed1SBarry Smith PetscFunctionBegin; 48928b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 49008401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 491fff043a9SJunchao Zhang 4929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49319b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49419b08ed1SBarry Smith row = im[k]; 49519b08ed1SBarry Smith rp = aj + ai[row]; 49619b08ed1SBarry Smith ap = aa + ai[row]; 49719b08ed1SBarry Smith 4989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49919b08ed1SBarry Smith if (!A->structure_only) { 50019b08ed1SBarry Smith if (v) { 5019566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50219b08ed1SBarry Smith v += n; 50319b08ed1SBarry Smith } else { 5049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith a->ilen[row] = n; 50819b08ed1SBarry Smith a->imax[row] = n; 50919b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 51019b08ed1SBarry Smith a->nz += n; 51119b08ed1SBarry Smith } 5129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51419b08ed1SBarry Smith } 51519b08ed1SBarry Smith 51619b08ed1SBarry Smith /*@ 51719b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51819b08ed1SBarry Smith 51919b08ed1SBarry Smith Input Parameters: 52011a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52219b08ed1SBarry Smith 52319b08ed1SBarry Smith Level: advanced 52419b08ed1SBarry Smith 52519b08ed1SBarry Smith Notes: 52619b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52711a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52819b08ed1SBarry Smith as always with multiple matrix assemblies. 52919b08ed1SBarry Smith 5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53119b08ed1SBarry Smith @*/ 532d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 533d71ae5a4SJacob Faibussowitsch { 53419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith PetscFunctionBegin; 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5389566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53919b08ed1SBarry Smith a->maxnz = nztotal; 5404dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54119b08ed1SBarry Smith if (!a->ilen) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54319b08ed1SBarry Smith } else { 5449566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54519b08ed1SBarry Smith } 54619b08ed1SBarry Smith 54719b08ed1SBarry Smith /* allocate the matrix space */ 54819b08ed1SBarry Smith if (A->structure_only) { 5499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 55119b08ed1SBarry Smith } 
else { 5529566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55319b08ed1SBarry Smith } 55419b08ed1SBarry Smith a->i[0] = 0; 55519b08ed1SBarry Smith if (A->structure_only) { 55619b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55719b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55819b08ed1SBarry Smith } else { 55919b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 56019b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56319b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56419b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56619b08ed1SBarry Smith } 56719b08ed1SBarry Smith 568ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 569d71ae5a4SJacob Faibussowitsch { 570071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 571071fcb05SBarry Smith PetscInt *rp, k, row; 572071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 573071fcb05SBarry Smith PetscInt *aj = a->j; 574fff043a9SJunchao Zhang MatScalar *aa, *ap; 575071fcb05SBarry Smith 576071fcb05SBarry Smith PetscFunctionBegin; 5779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 578071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 579071fcb05SBarry Smith row = im[k]; 5806bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 581071fcb05SBarry Smith rp = aj + ai[row]; 582071fcb05SBarry Smith ap = aa + ai[row]; 58348a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 584071fcb05SBarry Smith if (!A->structure_only) { 585071fcb05SBarry 
Smith if (v) { 5869566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 587071fcb05SBarry Smith v += n; 588071fcb05SBarry Smith } else { 5899566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith } 592071fcb05SBarry Smith ailen[row] = n; 593071fcb05SBarry Smith a->nz += n; 594071fcb05SBarry Smith } 5959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 597071fcb05SBarry Smith } 598071fcb05SBarry Smith 599ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 600d71ae5a4SJacob Faibussowitsch { 6017eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60297f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60397f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6044e208921SJed Brown const MatScalar *ap, *aa; 6057eb43aa7SLois Curfman McInnes 6063a40ed3dSBarry Smith PetscFunctionBegin; 6074e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6087eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6097eb43aa7SLois Curfman McInnes row = im[k]; 6109371c9d4SSatish Balay if (row < 0) { 6119371c9d4SSatish Balay v += n; 6129371c9d4SSatish Balay continue; 6139371c9d4SSatish Balay } /* negative row */ 61454c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6159371c9d4SSatish Balay rp = aj + ai[row]; 6169371c9d4SSatish Balay ap = aa + ai[row]; 6177eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6187eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6199371c9d4SSatish Balay if (in[l] < 0) { 6209371c9d4SSatish Balay v++; 6219371c9d4SSatish 
Balay continue; 6229371c9d4SSatish Balay } /* negative column */ 62354c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 624bfeeae90SHong Zhang col = in[l]; 6259371c9d4SSatish Balay high = nrow; 6269371c9d4SSatish Balay low = 0; /* assume unsorted */ 6277eb43aa7SLois Curfman McInnes while (high - low > 5) { 6287eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6297eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6307eb43aa7SLois Curfman McInnes else low = t; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6337eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6347eb43aa7SLois Curfman McInnes if (rp[i] == col) { 635b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6367eb43aa7SLois Curfman McInnes goto finished; 6377eb43aa7SLois Curfman McInnes } 6387eb43aa7SLois Curfman McInnes } 63997e567efSBarry Smith *v++ = 0.0; 6407eb43aa7SLois Curfman McInnes finished:; 6417eb43aa7SLois Curfman McInnes } 6427eb43aa7SLois Curfman McInnes } 6434e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6457eb43aa7SLois Curfman McInnes } 6467eb43aa7SLois Curfman McInnes 647ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 648d71ae5a4SJacob Faibussowitsch { 6493ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 650c898d852SStefano Zampini const PetscScalar *av; 6513ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6523ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65317ab2063SBarry Smith 6543a40ed3dSBarry Smith PetscFunctionBegin; 6559566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6562205254eSKarl Rupp 6573ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6583ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6593ea6fe3dSLisandro Dalcin m = 
mat->rmap->n; 6603ea6fe3dSLisandro Dalcin nz = A->nz; 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* write matrix header */ 6633ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6649371c9d4SSatish Balay header[1] = M; 6659371c9d4SSatish Balay header[2] = N; 6669371c9d4SSatish Balay header[3] = nz; 6679566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 668416022c9SBarry Smith 6693ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6713ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 703cd155464SBarry Smith 704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 705d71ae5a4SJacob Faibussowitsch { 706416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 707c898d852SStefano Zampini const PetscScalar *av; 70860e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 709e060cb09SBarry Smith const char *name; 710f3ef73ceSBarry Smith PetscViewerFormat format; 71117ab2063SBarry Smith 7123a40ed3dSBarry Smith PetscFunctionBegin; 7137dc0baabSHong Zhang if (A->structure_only) { 7149566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7167dc0baabSHong Zhang } 71743e49210SHong Zhang 7189566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7193ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7202e5835c6SStefano Zampini 721c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72471c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72597f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72660e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 727c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 728d00d2cf4SBarry Smith nofinalvalue = 1; 729d00d2cf4SBarry Smith } 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 733fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 735fbfe6fa7SJed Brown #else 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 737fbfe6fa7SJed Brown #endif 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73917ab2063SBarry Smith 74017ab2063SBarry Smith for (i = 0; i < m; i++) { 74160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 742aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74417ab2063SBarry Smith #else 7459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74617ab2063SBarry Smith #endif 74717ab2063SBarry Smith } 74817ab2063SBarry Smith } 749d00d2cf4SBarry Smith if (nofinalvalue) { 750c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 752c337ccceSJed Brown #else 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 754c337ccceSJed Brown #endif 755d00d2cf4SBarry Smith } 7569566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 759fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76144cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 764aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76536db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76936db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7716831982aSBarry Smith } 77244cd7ae7SLois Curfman McInnes #else 7739566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77444cd7ae7SLois Curfman McInnes #endif 77544cd7ae7SLois Curfman McInnes } 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77744cd7ae7SLois 
Curfman McInnes } 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 779fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78097f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7819566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 783496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 784496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 786496be53dSLois Curfman McInnes if (a->j[j] >= i) { 787aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 789496be53dSLois Curfman McInnes #else 790496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 791496be53dSLois Curfman McInnes #endif 792496be53dSLois Curfman McInnes } 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 7952e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7972e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7982205254eSKarl Rupp if (i + 4 < m) { 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8002205254eSKarl Rupp } else if (i + 3 < m) { 8019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8022205254eSKarl Rupp } else if (i + 2 < m) { 8039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8042205254eSKarl Rupp } else if (i + 1 < m) { 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8062205254eSKarl Rupp } else if (i < m) { 8079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8082205254eSKarl Rupp } else { 8099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8102205254eSKarl Rupp } 811496be53dSLois Curfman McInnes } 8129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8139566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8169566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 817496be53dSLois Curfman McInnes } 8189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 819496be53dSLois Curfman McInnes } 8209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 821496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 823496be53dSLois Curfman McInnes if (a->j[j] >= i) { 824aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82548a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 826496be53dSLois Curfman McInnes #else 8279566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
828496be53dSLois Curfman McInnes #endif 829496be53dSLois Curfman McInnes } 830496be53dSLois Curfman McInnes } 8319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 832496be53dSLois Curfman McInnes } 8339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 834fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83597f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83687828ca2SBarry Smith PetscScalar value; 83768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83968f1ed48SBarry Smith 84068f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84268f1ed48SBarry Smith realonly = PETSC_FALSE; 84368f1ed48SBarry Smith break; 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith #endif 84702594712SBarry Smith 8489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84902594712SBarry Smith for (i = 0; i < m; i++) { 85002594712SBarry Smith jcnt = 0; 851d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 852e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85302594712SBarry Smith value = a->a[cnt++]; 854e24b481bSBarry Smith jcnt++; 85502594712SBarry Smith } else { 85602594712SBarry Smith value = 0.0; 85702594712SBarry Smith } 858aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85968f1ed48SBarry Smith if (realonly) { 8609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86168f1ed48SBarry Smith } else { 8629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86368f1ed48SBarry Smith } 86402594712SBarry Smith #else 8659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86602594712SBarry Smith 
#endif 86702594712SBarry Smith } 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86902594712SBarry Smith } 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8713c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 872150b93efSMatthew G. Knepley PetscInt fshift = 1; 8739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8743c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8763c215bfdSMatthew Knepley #else 8779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8783c215bfdSMatthew Knepley #endif 8799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8803c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8823c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8839566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8843c215bfdSMatthew Knepley #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8863c215bfdSMatthew Knepley #endif 8873c215bfdSMatthew Knepley } 8883c215bfdSMatthew Knepley } 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8903a40ed3dSBarry Smith } else { 8919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 892d5f3da31SBarry Smith if (A->factortype) { 89316cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89516cd7e1dSShri Abhyankar /* L part */ 89660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90216cd7e1dSShri Abhyankar } else { 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90416cd7e1dSShri Abhyankar } 90516cd7e1dSShri Abhyankar #else 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90716cd7e1dSShri Abhyankar #endif 90816cd7e1dSShri Abhyankar } 90916cd7e1dSShri Abhyankar /* diagonal */ 91016cd7e1dSShri Abhyankar j = a->diag[i]; 91116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91616cd7e1dSShri Abhyankar } else { 9179566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91816cd7e1dSShri Abhyankar } 91916cd7e1dSShri Abhyankar #else 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92116cd7e1dSShri Abhyankar #endif 92216cd7e1dSShri Abhyankar 92316cd7e1dSShri Abhyankar /* U part */ 92460e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93016cd7e1dSShri Abhyankar } else { 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93216cd7e1dSShri Abhyankar } 93316cd7e1dSShri Abhyankar #else 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93516cd7e1dSShri Abhyankar #endif 93616cd7e1dSShri Abhyankar } 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar } else { 94017ab2063SBarry Smith for (i = 0; i < m; i++) { 9419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 943aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94436db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9483a40ed3dSBarry Smith } else { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95017ab2063SBarry Smith } 95117ab2063SBarry Smith #else 9529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95317ab2063SBarry Smith #endif 95417ab2063SBarry Smith } 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95617ab2063SBarry Smith } 95716cd7e1dSShri Abhyankar } 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95917ab2063SBarry Smith } 9609566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 962416022c9SBarry Smith } 963416022c9SBarry Smith 9649804daf3SBarry Smith #include <petscdraw.h> 965ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 966d71ae5a4SJacob Faibussowitsch { 967480ef9eaSBarry Smith Mat A = (Mat)Aa; 968416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 969383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 970383922c3SLisandro Dalcin int color; 971b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 972b0a32e0cSBarry Smith PetscViewer viewer; 973f3ef73ceSBarry Smith PetscViewerFormat format; 974fff043a9SJunchao Zhang const PetscScalar *aa; 975cddf8d76SBarry Smith 
9763a40ed3dSBarry Smith PetscFunctionBegin; 9779566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9799566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 980383922c3SLisandro Dalcin 981416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 983fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 984d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9850513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 986b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 987416022c9SBarry Smith for (i = 0; i < m; i++) { 9889371c9d4SSatish Balay y_l = m - i - 1.0; 9899371c9d4SSatish Balay y_r = y_l + 1.0; 990bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9919371c9d4SSatish Balay x_l = a->j[j]; 9929371c9d4SSatish Balay x_r = x_l + 1.0; 993fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9949566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 995cddf8d76SBarry Smith } 996cddf8d76SBarry Smith } 997b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 998cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9999371c9d4SSatish Balay y_l = m - i - 1.0; 10009371c9d4SSatish Balay y_r = y_l + 1.0; 1001bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10029371c9d4SSatish Balay x_l = a->j[j]; 10039371c9d4SSatish Balay x_r = x_l + 1.0; 1004fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10059566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1006cddf8d76SBarry Smith } 1007cddf8d76SBarry Smith } 1008b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1009cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10109371c9d4SSatish Balay y_l = m - i - 1.0; 10119371c9d4SSatish Balay y_r = y_l + 1.0; 1012bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10139371c9d4SSatish Balay x_l = a->j[j]; 10149371c9d4SSatish Balay x_r = x_l + 1.0; 1015fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10169566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1017416022c9SBarry Smith } 1018416022c9SBarry Smith } 1019d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10200513a670SBarry Smith } else { 10210513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10220513a670SBarry Smith /* first determine max of all nonzero values */ 1023b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1024383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1025b0a32e0cSBarry Smith PetscDraw popup; 10260513a670SBarry Smith 10270513a670SBarry Smith for (i = 0; i < nz; i++) { 1028fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10290513a670SBarry Smith } 1030383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10319566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1033383922c3SLisandro Dalcin 1034d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10350513a670SBarry Smith for (i = 0; i < m; i++) { 1036383922c3SLisandro Dalcin y_l = m - i - 1.0; 1037383922c3SLisandro Dalcin y_r = y_l + 1.0; 1038bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1039383922c3SLisandro Dalcin x_l = a->j[j]; 1040383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1041fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10429566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10430513a670SBarry Smith count++; 10440513a670SBarry Smith } 10450513a670SBarry Smith } 1046d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10470513a670SBarry Smith } 10489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1050480ef9eaSBarry Smith } 1051cddf8d76SBarry Smith 10529804daf3SBarry Smith #include <petscdraw.h> 1053ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1054d71ae5a4SJacob Faibussowitsch { 1055b0a32e0cSBarry Smith PetscDraw draw; 105636db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1057ace3abfcSBarry Smith PetscBool isnull; 1058480ef9eaSBarry Smith 1059480ef9eaSBarry Smith PetscFunctionBegin; 10609566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10619566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10623ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1063480ef9eaSBarry Smith 10649371c9d4SSatish Balay xr = A->cmap->n; 10659371c9d4SSatish Balay yr = A->rmap->n; 10669371c9d4SSatish Balay h = yr / 10.0; 10679371c9d4SSatish Balay w = xr / 10.0; 10689371c9d4SSatish Balay xr += w; 10699371c9d4SSatish Balay yr += h; 10709371c9d4SSatish Balay xl = -w; 10719371c9d4SSatish Balay yl = -h; 10729566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10739566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10749566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10759566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10769566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1078416022c9SBarry Smith } 1079416022c9SBarry Smith 1080d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1081d71ae5a4SJacob Faibussowitsch { 1082ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1083416022c9SBarry Smith 10843a40ed3dSBarry Smith PetscFunctionBegin; 10859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10881baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10891baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10901baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10919566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109317ab2063SBarry Smith } 109419bcc07fSBarry Smith 1095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1096d71ae5a4SJacob Faibussowitsch { 1097416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1098580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1099d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 110054f21887SBarry Smith MatScalar *aa = a->a, *ap; 11013447b6efSHong Zhang PetscReal ratio = 0.6; 110217ab2063SBarry Smith 11033a40ed3dSBarry Smith PetscFunctionBegin; 11043ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1106b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1107b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11089566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1110b215bc84SStefano Zampini } 111117ab2063SBarry Smith 111243ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111317ab2063SBarry Smith for (i = 1; i < m; i++) { 1114416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111517ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111694a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111717ab2063SBarry Smith if (fshift) { 1118bfeeae90SHong Zhang ip = aj + ai[i]; 1119bfeeae90SHong Zhang ap = aa + ai[i]; 112017ab2063SBarry Smith N = ailen[i]; 11219566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112248a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112317ab2063SBarry Smith } 112417ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112517ab2063SBarry Smith } 112617ab2063SBarry Smith if (m) { 112717ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112817ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112917ab2063SBarry Smith } 113017ab2063SBarry Smith /* reset ilen and imax for each row */ 11317b083b7cSBarry Smith a->nonzerorowcnt = 0; 1132396832f4SHong Zhang if (A->structure_only) { 11339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1135396832f4SHong Zhang } else { /* !A->structure_only */ 113617ab2063SBarry Smith for (i = 0; i < m; i++) { 113717ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11387b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113917ab2063SBarry Smith } 1140396832f4SHong Zhang } 
1141bfeeae90SHong Zhang a->nz = ai[m]; 1142aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 114317ab2063SBarry Smith 11449566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11459566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11469566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11479566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11482205254eSKarl Rupp 11498e58a170SBarry Smith A->info.mallocs += a->reallocs; 1150dd5f02e7SSatish Balay a->reallocs = 0; 11516712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115236db0b34SBarry Smith a->rmax = rmax; 11534e220ebcSLois Curfman McInnes 115448a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115717ab2063SBarry Smith } 115817ab2063SBarry Smith 1159ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1160d71ae5a4SJacob Faibussowitsch { 116199cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116299cafbc1SBarry Smith PetscInt i, nz = a->nz; 11632e5835c6SStefano Zampini MatScalar *aa; 116499cafbc1SBarry Smith 116599cafbc1SBarry Smith PetscFunctionBegin; 11669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116799cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11689566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117199cafbc1SBarry Smith } 117299cafbc1SBarry Smith 1173ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1174d71ae5a4SJacob Faibussowitsch { 117599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117699cafbc1SBarry Smith PetscInt i, nz = a->nz; 11772e5835c6SStefano Zampini MatScalar *aa; 117899cafbc1SBarry Smith 117999cafbc1SBarry Smith PetscFunctionBegin; 11809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118199cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118599cafbc1SBarry Smith } 118699cafbc1SBarry Smith 1187d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1188d71ae5a4SJacob Faibussowitsch { 1189fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1190fff043a9SJunchao Zhang MatScalar *aa; 11913a40ed3dSBarry Smith 11923a40ed3dSBarry Smith PetscFunctionBegin; 11939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11949566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119817ab2063SBarry Smith } 1199416022c9SBarry Smith 1200d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1201d71ae5a4SJacob Faibussowitsch { 1202416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1203d5d45c9bSBarry Smith 12043a40ed3dSBarry Smith PetscFunctionBegin; 
1205b4e2f619SBarry Smith if (A->hash_active) { 1206e3c72094SPierre Jolivet A->ops[0] = a->cops; 1207b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1208b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1209b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1210b4e2f619SBarry Smith } 1211b4e2f619SBarry Smith 12123ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12139566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12159566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12269566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1228901853e0SKris Buschelman 12296718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12306718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12316718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. 
We free it here to avoid 12326718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12336718818eSStefano Zampini due to different matrix sizes */ 12349566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12356718818eSStefano Zampini 12369566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12382e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12472e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12482e956fe4SStefano Zampini #endif 12494222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12519566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12534222ddf1SHong Zhang #endif 1254d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1255d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1256d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1257d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1258d5e393b6SSuyash Tandon #endif 12593d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12613d0639e7SStefano Zampini #endif 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1263af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1265af8000cdSHong Zhang #endif 1266d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1268d24d4204SJose E. 
Roman #endif 126963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127263c07aadSStefano Zampini #endif 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12772e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12892e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12902e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12912e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12922e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12932e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12942e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 129617ab2063SBarry Smith } 129717ab2063SBarry Smith 1298d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1299d71ae5a4SJacob Faibussowitsch { 1300416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13013a40ed3dSBarry Smith 13023a40ed3dSBarry Smith PetscFunctionBegin; 1303a65d3064SKris Buschelman switch (op) { 1304d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1305d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1306d71ae5a4SJacob Faibussowitsch break; 1307d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1308d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1309d71ae5a4SJacob Faibussowitsch break; 1310d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1311d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1312d71ae5a4SJacob Faibussowitsch break; 1313d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1314d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1315d71ae5a4SJacob Faibussowitsch break; 1316d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1317d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1318d71ae5a4SJacob Faibussowitsch break; 1319d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1320d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1321d71ae5a4SJacob Faibussowitsch break; 1322d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1323d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1324d71ae5a4SJacob Faibussowitsch break; 13253d472b54SHong Zhang case MAT_SPD: 1326b1646e73SJed Brown case MAT_SYMMETRIC: 1327b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1328b1646e73SJed Brown case MAT_HERMITIAN: 1329b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1330957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1331b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1332b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1333b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13345021d80fSJed Brown break; 13358c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1336a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1337d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1338d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1339d71ae5a4SJacob Faibussowitsch break; 1340d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1341d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1342d71ae5a4SJacob Faibussowitsch break; 1343d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1344d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1345d71ae5a4SJacob Faibussowitsch break; 
1346071fcb05SBarry Smith case MAT_SORTED_FULL: 1347071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1348071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1349071fcb05SBarry Smith break; 1350d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1351d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1352d71ae5a4SJacob Faibussowitsch break; 1353d71ae5a4SJacob Faibussowitsch default: 1354d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1355a65d3064SKris Buschelman } 13563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 135717ab2063SBarry Smith } 135817ab2063SBarry Smith 1359ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1360d71ae5a4SJacob Faibussowitsch { 1361416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1362fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1363c898d852SStefano Zampini PetscScalar *x; 1364c898d852SStefano Zampini const PetscScalar *aa; 136517ab2063SBarry Smith 13663a40ed3dSBarry Smith PetscFunctionBegin; 13679566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136808401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1370d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1371d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13729566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13732c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13749566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 137735e7444dSHong Zhang } 137835e7444dSHong Zhang 13799566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138035e7444dSHong Zhang for (i = 0; i < n; i++) { 1381fdc842d1SBarry Smith x[i] = 0.0; 138235e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 138335e7444dSHong Zhang if (aj[j] == i) { 138435e7444dSHong Zhang x[i] = aa[j]; 138517ab2063SBarry Smith break; 138617ab2063SBarry Smith } 138717ab2063SBarry Smith } 138817ab2063SBarry Smith } 13899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139217ab2063SBarry Smith } 139317ab2063SBarry Smith 1394c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1395d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1396d71ae5a4SJacob Faibussowitsch { 1397416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13985f22a7b3SSebastian Grimberg const MatScalar *aa; 1399d9ca1df4SBarry Smith PetscScalar *y; 1400d9ca1df4SBarry Smith const PetscScalar *x; 1401d0f46423SBarry Smith PetscInt m = A->rmap->n; 14025c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14035f22a7b3SSebastian Grimberg const MatScalar *v; 1404a77337e4SBarry Smith PetscScalar alpha; 1405d9ca1df4SBarry Smith PetscInt n, i, j; 1406d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14073447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1408ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14095c897100SBarry Smith #endif 141017ab2063SBarry Smith 14113a40ed3dSBarry Smith PetscFunctionBegin; 14129566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14139566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14149566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14165c897100SBarry Smith 14175c897100SBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1418fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14195c897100SBarry Smith #else 14203447b6efSHong Zhang if (usecprow) { 14213447b6efSHong Zhang m = cprow.nrows; 14223447b6efSHong Zhang ii = cprow.i; 14237b2bb3b9SHong Zhang ridx = cprow.rindex; 14243447b6efSHong Zhang } else { 14253447b6efSHong Zhang ii = a->i; 14263447b6efSHong Zhang } 142717ab2063SBarry Smith for (i = 0; i < m; i++) { 14283447b6efSHong Zhang idx = a->j + ii[i]; 1429fff043a9SJunchao Zhang v = aa + ii[i]; 14303447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14313447b6efSHong Zhang if (usecprow) { 14327b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14333447b6efSHong Zhang } else { 143417ab2063SBarry Smith alpha = x[i]; 14353447b6efSHong Zhang } 143604fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143717ab2063SBarry Smith } 14385c897100SBarry Smith #endif 14399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14409566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14419566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 144417ab2063SBarry Smith } 144517ab2063SBarry Smith 1446d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1447d71ae5a4SJacob Faibussowitsch { 14485c897100SBarry Smith PetscFunctionBegin; 14499566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14509566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14525c897100SBarry Smith } 14535c897100SBarry Smith 1454c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145578b84d54SShri Abhyankar 1456d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 
1457d71ae5a4SJacob Faibussowitsch { 1458416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1459d9fead3dSBarry Smith PetscScalar *y; 146054f21887SBarry Smith const PetscScalar *x; 1461fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1462003131ecSBarry Smith PetscInt m = A->rmap->n; 14630298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14647b083b7cSBarry Smith PetscInt n, i; 1465362ced78SSatish Balay PetscScalar sum; 1466ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146717ab2063SBarry Smith 1468b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146997952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1470fee21e36SBarry Smith #endif 1471fee21e36SBarry Smith 14723a40ed3dSBarry Smith PetscFunctionBegin; 1473b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14749566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1476b215bc84SStefano Zampini } 14779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14789566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14799566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1480416022c9SBarry Smith ii = a->i; 14814eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14829566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 148397952fefSHong Zhang m = a->compressedrow.nrows; 148497952fefSHong Zhang ii = a->compressedrow.i; 148597952fefSHong Zhang ridx = a->compressedrow.rindex; 148697952fefSHong Zhang for (i = 0; i < m; i++) { 148797952fefSHong Zhang n = ii[i + 1] - ii[i]; 148897952fefSHong Zhang aj = a->j + ii[i]; 1489fff043a9SJunchao Zhang aa = a_a + ii[i]; 149097952fefSHong Zhang sum = 0.0; 1491003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1492003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 149397952fefSHong Zhang y[*ridx++] = sum; 149497952fefSHong Zhang } 149597952fefSHong 
Zhang } else { /* do not use compressed row format */ 1496b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14973d3eaba7SBarry Smith aj = a->j; 1498fff043a9SJunchao Zhang aa = a_a; 1499b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1500b05257ddSBarry Smith #else 150117ab2063SBarry Smith for (i = 0; i < m; i++) { 1502003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1503003131ecSBarry Smith aj = a->j + ii[i]; 1504fff043a9SJunchao Zhang aa = a_a + ii[i]; 150517ab2063SBarry Smith sum = 0.0; 1506003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150717ab2063SBarry Smith y[i] = sum; 150817ab2063SBarry Smith } 15098d195f9aSBarry Smith #endif 1510b05257ddSBarry Smith } 15119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15129566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15139566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 151617ab2063SBarry Smith } 151717ab2063SBarry Smith 1518ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1519ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1520d71ae5a4SJacob Faibussowitsch { 1521b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1522b434eb95SMatthew G. Knepley PetscScalar *y; 1523b434eb95SMatthew G. Knepley const PetscScalar *x; 1524fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1525b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1526b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1527b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1528b434eb95SMatthew G. Knepley PetscScalar sum; 1529b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1530b434eb95SMatthew G. Knepley 1531b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1532b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1533b434eb95SMatthew G. Knepley #endif 1534b434eb95SMatthew G. Knepley 1535b434eb95SMatthew G. Knepley PetscFunctionBegin; 15369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15379566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15389566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1539b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1540b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1541b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1542b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1543b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1544b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1545b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1546fff043a9SJunchao Zhang aa = a_a + ii[i]; 1547b434eb95SMatthew G. Knepley sum = 0.0; 1548b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1549b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1550b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1551b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1552b434eb95SMatthew G. Knepley } 1553b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15543d3eaba7SBarry Smith ii = a->i; 1555b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1556b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1557b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1558fff043a9SJunchao Zhang aa = a_a + ii[i]; 1559b434eb95SMatthew G. Knepley sum = 0.0; 1560b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1561b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1562b434eb95SMatthew G. Knepley y[i] = sum; 1563b434eb95SMatthew G. Knepley } 1564b434eb95SMatthew G. 
Knepley } 15659566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15669566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15679566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. Knepley 1572ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1573ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1574d71ae5a4SJacob Faibussowitsch { 1575b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1576b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1577b434eb95SMatthew G. Knepley const PetscScalar *x; 1578fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1579b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1580b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1581b434eb95SMatthew G. Knepley PetscScalar sum; 1582b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1583b434eb95SMatthew G. Knepley 1584b434eb95SMatthew G. Knepley PetscFunctionBegin; 15859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15869566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15879566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1588b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158948a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1590b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1591b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1592b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1593b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1594b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1595b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1596fff043a9SJunchao Zhang aa = a_a + ii[i]; 1597b434eb95SMatthew G. Knepley sum = y[*ridx]; 1598b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1599b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1600b434eb95SMatthew G. Knepley } 1601b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16023d3eaba7SBarry Smith ii = a->i; 1603b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1604b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1605b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1606fff043a9SJunchao Zhang aa = a_a + ii[i]; 1607b434eb95SMatthew G. Knepley sum = y[i]; 1608b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1609b434eb95SMatthew G. Knepley z[i] = sum; 1610b434eb95SMatthew G. Knepley } 1611b434eb95SMatthew G. Knepley } 16129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16139566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16149566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1617b434eb95SMatthew G. Knepley } 1618b434eb95SMatthew G. 
Knepley 1619c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1620d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1621d71ae5a4SJacob Faibussowitsch { 1622416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1623f15663dcSBarry Smith PetscScalar *y, *z; 1624f15663dcSBarry Smith const PetscScalar *x; 1625fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1626d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1627d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1628362ced78SSatish Balay PetscScalar sum; 1629ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16309ea0dfa2SSatish Balay 16313a40ed3dSBarry Smith PetscFunctionBegin; 1632b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16339566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1635b215bc84SStefano Zampini } 16369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16379566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16389566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16394eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164048a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164197952fefSHong Zhang m = a->compressedrow.nrows; 164297952fefSHong Zhang ii = a->compressedrow.i; 164397952fefSHong Zhang ridx = a->compressedrow.rindex; 164497952fefSHong Zhang for (i = 0; i < m; i++) { 164597952fefSHong Zhang n = ii[i + 1] - ii[i]; 164697952fefSHong Zhang aj = a->j + ii[i]; 1647fff043a9SJunchao Zhang aa = a_a + ii[i]; 164897952fefSHong Zhang sum = y[*ridx]; 1649f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165097952fefSHong Zhang z[*ridx++] = sum; 165197952fefSHong Zhang } 165297952fefSHong Zhang } else { /* do not use compressed row format */ 16533d3eaba7SBarry Smith ii = a->i; 
1654f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16553d3eaba7SBarry Smith aj = a->j; 1656fff043a9SJunchao Zhang aa = a_a; 1657f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1658f15663dcSBarry Smith #else 165917ab2063SBarry Smith for (i = 0; i < m; i++) { 1660f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1661f15663dcSBarry Smith aj = a->j + ii[i]; 1662fff043a9SJunchao Zhang aa = a_a + ii[i]; 166317ab2063SBarry Smith sum = y[i]; 1664f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166517ab2063SBarry Smith z[i] = sum; 166617ab2063SBarry Smith } 166702ab625aSSatish Balay #endif 1668f15663dcSBarry Smith } 16699566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16709566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16719566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167417ab2063SBarry Smith } 167517ab2063SBarry Smith 167617ab2063SBarry Smith /* 167717ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167817ab2063SBarry Smith */ 1679d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1680d71ae5a4SJacob Faibussowitsch { 1681416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1682d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1683c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 168417ab2063SBarry Smith 16853a40ed3dSBarry Smith PetscFunctionBegin; 168609f38230SBarry Smith if (!a->diag) { 16879566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1688c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168909f38230SBarry Smith } 1690d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1691c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1692c0c07093SJunchao Zhang if (alreadySet) { 1693c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1694c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1695c0c07093SJunchao Zhang } 1696c0c07093SJunchao Zhang 169709f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1698bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1699bfeeae90SHong Zhang if (a->j[j] == i) { 170009f38230SBarry Smith a->diag[i] = j; 170117ab2063SBarry Smith break; 170217ab2063SBarry Smith } 170317ab2063SBarry Smith } 170417ab2063SBarry Smith } 17053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 170617ab2063SBarry Smith } 170717ab2063SBarry Smith 1708ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1709d71ae5a4SJacob Faibussowitsch { 171061ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171161ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171261ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171361ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 171461ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 171561ecd0c6SBarry Smith 171661ecd0c6SBarry 
Smith PetscFunctionBegin; 171761ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17199566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172161ecd0c6SBarry Smith } 172261ecd0c6SBarry Smith 172361ecd0c6SBarry Smith if (a->diagonaldense) { 172461ecd0c6SBarry Smith cnt = 0; 172561ecd0c6SBarry Smith } else { 17269566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172761ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1728349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172961ecd0c6SBarry Smith cnt++; 173061ecd0c6SBarry Smith mdiag[i] = 1; 173161ecd0c6SBarry Smith } 173261ecd0c6SBarry Smith } 173361ecd0c6SBarry Smith } 173461ecd0c6SBarry Smith if (!cnt) { 17359566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 173661ecd0c6SBarry Smith } else { 1737b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1738b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173961ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 174061ecd0c6SBarry Smith 174161ecd0c6SBarry Smith a->a = NULL; 174261ecd0c6SBarry Smith a->j = NULL; 174361ecd0c6SBarry Smith a->i = NULL; 174461ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1745ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 174761ecd0c6SBarry Smith 174861ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174961ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17509566063dSJacob 
Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 175148a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1752447d62f5SStefano Zampini } 17539566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17549566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 175561ecd0c6SBarry Smith if (singlemalloc) { 17569566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 175761ecd0c6SBarry Smith } else { 17589566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17599566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17609566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 176161ecd0c6SBarry Smith } 176261ecd0c6SBarry Smith } 17639566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 176461ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 176661ecd0c6SBarry Smith } 176761ecd0c6SBarry Smith 1768be5855fcSBarry Smith /* 1769be5855fcSBarry Smith Checks for missing diagonals 1770be5855fcSBarry Smith */ 1771d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1772d71ae5a4SJacob Faibussowitsch { 1773be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17747734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1775be5855fcSBarry Smith 1776be5855fcSBarry Smith PetscFunctionBegin; 177709f38230SBarry Smith *missing = PETSC_FALSE; 17787734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177909f38230SBarry Smith *missing = PETSC_TRUE; 178009f38230SBarry Smith if (d) *d = 0; 17819566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 178209f38230SBarry Smith } else { 178301445905SHong Zhang PetscInt n; 178401445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1785f1e2ffcdSBarry Smith diag = a->diag; 178601445905SHong Zhang for (i = 0; i < n; i++) { 17877734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178809f38230SBarry Smith *missing = PETSC_TRUE; 178909f38230SBarry Smith if (d) *d = i; 17909566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1791358d2f5dSShri Abhyankar break; 179209f38230SBarry Smith } 1793be5855fcSBarry Smith } 1794be5855fcSBarry Smith } 17953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1796be5855fcSBarry Smith } 1797be5855fcSBarry Smith 17980da83c2eSBarry Smith #include <petscblaslapack.h> 17990da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18000da83c2eSBarry Smith 18010da83c2eSBarry Smith /* 18020da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18030da83c2eSBarry Smith */ 1804ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1805d71ae5a4SJacob Faibussowitsch { 18060da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18070da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18080da83c2eSBarry Smith const PetscReal shift = 0.0; 18090da83c2eSBarry Smith PetscInt ipvt[5]; 18104e208921SJed Brown PetscCount flops = 0; 18110da83c2eSBarry Smith PetscScalar work[25], *v_work; 18120da83c2eSBarry Smith 18130da83c2eSBarry Smith PetscFunctionBegin; 18140da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18150da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 181608401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1817ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181948a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18200da83c2eSBarry Smith ncnt = 0; 18210da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18220da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18239566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18240da83c2eSBarry Smith switch (bsizes[i]) { 1825d71ae5a4SJacob Faibussowitsch case 1: 1826d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1827d71ae5a4SJacob Faibussowitsch break; 18280da83c2eSBarry Smith case 2: 18299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18300da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18320da83c2eSBarry Smith break; 18330da83c2eSBarry Smith case 3: 18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18350da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18370da83c2eSBarry Smith break; 18380da83c2eSBarry Smith case 4: 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18400da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18420da83c2eSBarry Smith break; 18430da83c2eSBarry Smith case 5: 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18450da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18470da83c2eSBarry Smith break; 18480da83c2eSBarry Smith case 6: 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18500da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18520da83c2eSBarry Smith break; 18530da83c2eSBarry Smith case 7: 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18550da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18570da83c2eSBarry Smith break; 18580da83c2eSBarry Smith default: 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18600da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18620da83c2eSBarry Smith } 18630da83c2eSBarry Smith ncnt += bsizes[i]; 18640da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18654e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18660da83c2eSBarry Smith } 18673ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 186848a46eb9SPierre Jolivet if 
(bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18699566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18710da83c2eSBarry Smith } 18720da83c2eSBarry Smith 1873422a814eSBarry Smith /* 1874422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1875422a814eSBarry Smith */ 1876ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1877d71ae5a4SJacob Faibussowitsch { 187871f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1879d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18802e5835c6SStefano Zampini const MatScalar *v; 188154f21887SBarry Smith PetscScalar *idiag, *mdiag; 188271f1c65dSBarry Smith 188371f1c65dSBarry Smith PetscFunctionBegin; 18843ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 188671f1c65dSBarry Smith diag = a->diag; 18874dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18882e5835c6SStefano Zampini 188971f1c65dSBarry Smith mdiag = a->mdiag; 189071f1c65dSBarry Smith idiag = a->idiag; 18919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1892422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 189371f1c65dSBarry Smith for (i = 0; i < m; i++) { 189471f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1895899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1896899639b0SHong Zhang if (PetscRealPart(fshift)) { 18979566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18987b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18997b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19007b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 190198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1902899639b0SHong Zhang } 190371f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 190471f1c65dSBarry Smith } 19059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 190671f1c65dSBarry Smith } else { 190771f1c65dSBarry Smith for (i = 0; i < m; i++) { 190871f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 190971f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 191071f1c65dSBarry Smith } 19119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 191271f1c65dSBarry Smith } 191371f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 191671f1c65dSBarry Smith } 191771f1c65dSBarry Smith 1918c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1919d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1920d71ae5a4SJacob Faibussowitsch { 1921416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1922e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19232e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 192454f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19253d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 192697f1f81fSBarry Smith const PetscInt *idx, *diag; 192717ab2063SBarry Smith 19283a40ed3dSBarry Smith PetscFunctionBegin; 1929b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19309566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1932b215bc84SStefano Zampini } 1933b965ef7fSBarry Smith its = its * lits; 
193491723122SBarry Smith 193571f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19369566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 193771f1c65dSBarry Smith a->fshift = fshift; 193871f1c65dSBarry Smith a->omega = omega; 1939ed480e8bSBarry Smith 194071f1c65dSBarry Smith diag = a->diag; 194171f1c65dSBarry Smith t = a->ssor_work; 1942ed480e8bSBarry Smith idiag = a->idiag; 194371f1c65dSBarry Smith mdiag = a->mdiag; 1944ed480e8bSBarry Smith 19459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19469566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19479566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1948ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 194917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 195017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1951ed480e8bSBarry Smith bs = b; 195217ab2063SBarry Smith for (i = 0; i < m; i++) { 195371f1c65dSBarry Smith d = fshift + mdiag[i]; 1954416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1955ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19562e5835c6SStefano Zampini v = aa + diag[i] + 1; 195717ab2063SBarry Smith sum = b[i] * d / omega; 1958003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 195917ab2063SBarry Smith x[i] = sum; 196017ab2063SBarry Smith } 19619566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19629566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19649566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 196617ab2063SBarry Smith } 1967c783ea89SBarry Smith 196808401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, 
PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1969f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19704c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1971887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 197217ab2063SBarry Smith 197317ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 197417ab2063SBarry Smith 1975887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 197617ab2063SBarry Smith */ 197717ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 197817ab2063SBarry Smith 197917ab2063SBarry Smith /* x = (E + U)^{-1} b */ 198017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1981416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1982ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19832e5835c6SStefano Zampini v = aa + diag[i] + 1; 198417ab2063SBarry Smith sum = b[i]; 1985e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1986ed480e8bSBarry Smith x[i] = sum * idiag[i]; 198717ab2063SBarry Smith } 198817ab2063SBarry Smith 198917ab2063SBarry Smith /* t = b - (2*E - D)x */ 19902e5835c6SStefano Zampini v = aa; 19912205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 199217ab2063SBarry Smith 199317ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1994ed480e8bSBarry Smith ts = t; 1995416022c9SBarry Smith diag = a->diag; 199617ab2063SBarry Smith for (i = 0; i < m; i++) { 1997416022c9SBarry Smith n = diag[i] - a->i[i]; 1998ed480e8bSBarry Smith idx = a->j + a->i[i]; 19992e5835c6SStefano Zampini v = aa + a->i[i]; 200017ab2063SBarry Smith sum = t[i]; 2001003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2002ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2003733d66baSBarry Smith /* x = x + t */ 2004733d66baSBarry Smith x[i] += t[i]; 200517ab2063SBarry Smith } 200617ab2063SBarry Smith 20079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20089566063dSJacob Faibussowitsch 
PetscCall(VecRestoreArray(xx, &x)); 20099566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 201117ab2063SBarry Smith } 201217ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 201317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 201417ab2063SBarry Smith for (i = 0; i < m; i++) { 2015416022c9SBarry Smith n = diag[i] - a->i[i]; 2016ed480e8bSBarry Smith idx = a->j + a->i[i]; 20172e5835c6SStefano Zampini v = aa + a->i[i]; 201817ab2063SBarry Smith sum = b[i]; 2019e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20205c99c7daSBarry Smith t[i] = sum; 2021ed480e8bSBarry Smith x[i] = sum * idiag[i]; 202217ab2063SBarry Smith } 20235c99c7daSBarry Smith xb = t; 20249566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20253a40ed3dSBarry Smith } else xb = b; 202617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 202717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2028416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2029ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20302e5835c6SStefano Zampini v = aa + diag[i] + 1; 203117ab2063SBarry Smith sum = xb[i]; 2032e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20335c99c7daSBarry Smith if (xb == b) { 2034ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20355c99c7daSBarry Smith } else { 2036b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 203717ab2063SBarry Smith } 20385c99c7daSBarry Smith } 20399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 204017ab2063SBarry Smith } 204117ab2063SBarry Smith its--; 204217ab2063SBarry Smith } 204317ab2063SBarry Smith while (its--) { 204417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204517ab2063SBarry Smith for (i = 0; i < m; i++) { 2046b19a5dc2SMark Adams /* lower */ 
2047b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2048ed480e8bSBarry Smith idx = a->j + a->i[i]; 20492e5835c6SStefano Zampini v = aa + a->i[i]; 205017ab2063SBarry Smith sum = b[i]; 2051e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2052b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2053b19a5dc2SMark Adams /* upper */ 2054b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2055b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20562e5835c6SStefano Zampini v = aa + diag[i] + 1; 2057b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2058b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 205917ab2063SBarry Smith } 2060b19a5dc2SMark Adams xb = t; 20619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2062b19a5dc2SMark Adams } else xb = b; 206317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 206417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2065b19a5dc2SMark Adams sum = xb[i]; 2066b19a5dc2SMark Adams if (xb == b) { 2067b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2068416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2069ed480e8bSBarry Smith idx = a->j + a->i[i]; 20702e5835c6SStefano Zampini v = aa + a->i[i]; 2071e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2072ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2073b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2074b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2075b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20762e5835c6SStefano Zampini v = aa + diag[i] + 1; 2077b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2078b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207917ab2063SBarry Smith } 2080b19a5dc2SMark Adams } 2081b19a5dc2SMark Adams if (xb == b) { 20829566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2083b19a5dc2SMark Adams } else { 20849566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2085b19a5dc2SMark Adams } 208617ab2063SBarry Smith } 208717ab2063SBarry Smith } 20889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20899566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20909566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 209217ab2063SBarry Smith } 209317ab2063SBarry Smith 2094ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2095d71ae5a4SJacob Faibussowitsch { 2096416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20974e220ebcSLois Curfman McInnes 20983a40ed3dSBarry Smith PetscFunctionBegin; 20994e220ebcSLois Curfman McInnes info->block_size = 1.0; 21003966268fSBarry Smith info->nz_allocated = a->maxnz; 21013966268fSBarry Smith info->nz_used = a->nz; 21023966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21033966268fSBarry Smith info->assemblies = A->num_ass; 21043966268fSBarry Smith info->mallocs = A->info.mallocs; 21054dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2106d5f3da31SBarry Smith if (A->factortype) { 21074e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21084e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21094e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21104e220ebcSLois Curfman McInnes } else { 21114e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21124e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21134e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21144e220ebcSLois Curfman McInnes } 21153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 211617ab2063SBarry Smith } 211717ab2063SBarry Smith 2118ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2119d71ae5a4SJacob Faibussowitsch { 2120416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2121c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 212297b48c8fSBarry Smith const PetscScalar *xx; 21232e5835c6SStefano Zampini PetscScalar *bb, *aa; 2124c7da8527SEric Chamberland PetscInt d = 0; 212517ab2063SBarry Smith 21263a40ed3dSBarry Smith PetscFunctionBegin; 212797b48c8fSBarry Smith if (x && b) { 21289566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21299566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 213097b48c8fSBarry Smith for (i = 0; i < N; i++) { 2131aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2132447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213397b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 213497b48c8fSBarry Smith } 21359566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21369566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 213797b48c8fSBarry Smith } 213897b48c8fSBarry Smith 21399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2140a9817697SBarry Smith if (a->keepnonzeropattern) { 2141f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2142aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21439566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2144f1e2ffcdSBarry Smith } 2145f4df32b1SMatthew Knepley if (diag != 0.0) { 2146c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2147c7da8527SEric 
Chamberland d = rows[i]; 2148447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214908401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2150c7da8527SEric Chamberland } 2151f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2152447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21532e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2154f1e2ffcdSBarry Smith } 2155f1e2ffcdSBarry Smith } 2156f1e2ffcdSBarry Smith } else { 2157f4df32b1SMatthew Knepley if (diag != 0.0) { 215817ab2063SBarry Smith for (i = 0; i < N; i++) { 2159aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21607ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2161447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2162447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2163447d62f5SStefano Zampini } else { 2164416022c9SBarry Smith a->ilen[rows[i]] = 1; 21652e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2166bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2167447d62f5SStefano Zampini } 2168447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21699566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 217017ab2063SBarry Smith } 217117ab2063SBarry Smith } 21723a40ed3dSBarry Smith } else { 217317ab2063SBarry Smith for (i = 0; i < N; i++) { 2174aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2175416022c9SBarry Smith a->ilen[rows[i]] = 0; 217617ab2063SBarry Smith } 217717ab2063SBarry Smith } 2178e56f5c9eSBarry Smith A->nonzerostate++; 2179f1e2ffcdSBarry Smith } 21809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2181dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218317ab2063SBarry Smith } 218417ab2063SBarry Smith 2185ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2186d71ae5a4SJacob Faibussowitsch { 21876e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21886e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21892b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21906e169961SBarry Smith const PetscScalar *xx; 21912e5835c6SStefano Zampini PetscScalar *bb, *aa; 21926e169961SBarry Smith 21936e169961SBarry Smith PetscFunctionBegin; 21943ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 21959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21966e169961SBarry Smith if (x && b) { 21979566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21989566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21992b40b63fSBarry Smith vecs = PETSC_TRUE; 22006e169961SBarry Smith } 22019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22026e169961SBarry Smith for (i = 0; i < N; i++) { 2203aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22049566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 22052205254eSKarl Rupp 22066e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22076e169961SBarry Smith } 22086e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22096e169961SBarry Smith if (!zeroed[i]) { 22106e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22114cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22122e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22132e5835c6SStefano Zampini aa[j] = 0.0; 
22146e169961SBarry Smith } 22156e169961SBarry Smith } 22164cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22176e169961SBarry Smith } 22186e169961SBarry Smith if (x && b) { 22199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22216e169961SBarry Smith } 22229566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22236e169961SBarry Smith if (diag != 0.0) { 22249566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22251d5a398dSstefano_zampini if (missing) { 22261d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22274cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2228aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22299566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22301d5a398dSstefano_zampini } 22311d5a398dSstefano_zampini } else { 2232ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22336e169961SBarry Smith } 22341d5a398dSstefano_zampini } 22359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2236dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22386e169961SBarry Smith } 22396e169961SBarry Smith 2240d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2241d71ae5a4SJacob Faibussowitsch { 2242fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2243fff043a9SJunchao Zhang const PetscScalar *aa; 224417ab2063SBarry Smith 22453a40ed3dSBarry Smith PetscFunctionBegin; 22469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2247416022c9SBarry Smith 
*nz = a->i[row + 1] - a->i[row]; 22485c0db29aSPierre Jolivet if (v) *v = aa ? (PetscScalar *)(aa + a->i[row]) : NULL; 224917ab2063SBarry Smith if (idx) { 22505c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2251f4259b30SLisandro Dalcin else *idx = NULL; 225217ab2063SBarry Smith } 22539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225517ab2063SBarry Smith } 225617ab2063SBarry Smith 2257d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2258d71ae5a4SJacob Faibussowitsch { 22593a40ed3dSBarry Smith PetscFunctionBegin; 2260cb4a9cd9SHong Zhang if (nz) *nz = 0; 22612e5835c6SStefano Zampini if (idx) *idx = NULL; 22622e5835c6SStefano Zampini if (v) *v = NULL; 22633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226417ab2063SBarry Smith } 226517ab2063SBarry Smith 2266ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2267d71ae5a4SJacob Faibussowitsch { 2268416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22692e5835c6SStefano Zampini const MatScalar *v; 227036db0b34SBarry Smith PetscReal sum = 0.0; 227197f1f81fSBarry Smith PetscInt i, j; 227217ab2063SBarry Smith 22733a40ed3dSBarry Smith PetscFunctionBegin; 22749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227517ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2276570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2277570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2278792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2279570b7f6dSBarry Smith #else 2280416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22819371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22829371c9d4SSatish Balay v++; 228317ab2063SBarry Smith } 22848f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 
2285570b7f6dSBarry Smith #endif 22869566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 22873a40ed3dSBarry Smith } else if (type == NORM_1) { 228836db0b34SBarry Smith PetscReal *tmp; 228997f1f81fSBarry Smith PetscInt *jj = a->j; 22909566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2291064f8208SBarry Smith *nrm = 0.0; 2292416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22939371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22949371c9d4SSatish Balay v++; 229517ab2063SBarry Smith } 2296d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2297064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229817ab2063SBarry Smith } 22999566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23013a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2302064f8208SBarry Smith *nrm = 0.0; 2303d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23042e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 230517ab2063SBarry Smith sum = 0.0; 2306416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23079371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23089371c9d4SSatish Balay v2++; 230917ab2063SBarry Smith } 2310064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231117ab2063SBarry Smith } 23129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2313f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 231617ab2063SBarry Smith } 231717ab2063SBarry Smith 2318ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2319d71ae5a4SJacob Faibussowitsch { 23203d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 
232154f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23222e5835c6SStefano Zampini const MatScalar *va, *vb; 232397f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2324cd0d46ebSvictorle 2325cd0d46ebSvictorle PetscFunctionBegin; 23269566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23279566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23285485867bSBarry Smith if (ma != nb || na != mb) { 23295485867bSBarry Smith *f = PETSC_FALSE; 23303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23315485867bSBarry Smith } 23329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23349371c9d4SSatish Balay aii = aij->i; 23359371c9d4SSatish Balay bii = bij->i; 23369371c9d4SSatish Balay adx = aij->j; 23379371c9d4SSatish Balay bdx = bij->j; 23389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23399566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2340cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2341cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2342cd0d46ebSvictorle 2343cd0d46ebSvictorle *f = PETSC_TRUE; 2344cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2345cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234697f1f81fSBarry Smith PetscInt idc, idr; 23475485867bSBarry Smith PetscScalar vc, vr; 2348cd0d46ebSvictorle /* column/row index/value */ 23495485867bSBarry Smith idc = adx[aptr[i]]; 23505485867bSBarry Smith idr = bdx[bptr[idc]]; 23515485867bSBarry Smith vc = va[aptr[i]]; 23525485867bSBarry Smith vr = vb[bptr[idc]]; 23535485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23545485867bSBarry Smith *f = PETSC_FALSE; 23555485867bSBarry Smith goto done; 2356cd0d46ebSvictorle } else { 23575485867bSBarry Smith aptr[i]++; 23585485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2359cd0d46ebSvictorle } 2360cd0d46ebSvictorle } 2361cd0d46ebSvictorle } 
2362cd0d46ebSvictorle done: 23639566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23649566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2368cd0d46ebSvictorle } 2369cd0d46ebSvictorle 2370ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2371d71ae5a4SJacob Faibussowitsch { 23723d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 237354f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 237454f21887SBarry Smith MatScalar *va, *vb; 23751cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23761cbb95d3SBarry Smith 23771cbb95d3SBarry Smith PetscFunctionBegin; 23789566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23799566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23801cbb95d3SBarry Smith if (ma != nb || na != mb) { 23811cbb95d3SBarry Smith *f = PETSC_FALSE; 23823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23831cbb95d3SBarry Smith } 23849371c9d4SSatish Balay aii = aij->i; 23859371c9d4SSatish Balay bii = bij->i; 23869371c9d4SSatish Balay adx = aij->j; 23879371c9d4SSatish Balay bdx = bij->j; 23889371c9d4SSatish Balay va = aij->a; 23899371c9d4SSatish Balay vb = bij->a; 23909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23919566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23921cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23931cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23941cbb95d3SBarry Smith 23951cbb95d3SBarry Smith *f = PETSC_TRUE; 23961cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23971cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23981cbb95d3SBarry Smith PetscInt idc, idr; 
23991cbb95d3SBarry Smith PetscScalar vc, vr; 24001cbb95d3SBarry Smith /* column/row index/value */ 24011cbb95d3SBarry Smith idc = adx[aptr[i]]; 24021cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24031cbb95d3SBarry Smith vc = va[aptr[i]]; 24041cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24051cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24061cbb95d3SBarry Smith *f = PETSC_FALSE; 24071cbb95d3SBarry Smith goto done; 24081cbb95d3SBarry Smith } else { 24091cbb95d3SBarry Smith aptr[i]++; 24101cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24111cbb95d3SBarry Smith } 24121cbb95d3SBarry Smith } 24131cbb95d3SBarry Smith } 24141cbb95d3SBarry Smith done: 24159566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24169566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24181cbb95d3SBarry Smith } 24191cbb95d3SBarry Smith 2420ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2421d71ae5a4SJacob Faibussowitsch { 24229e29f15eSvictorle PetscFunctionBegin; 24239566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24259e29f15eSvictorle } 24269e29f15eSvictorle 2427ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2428d71ae5a4SJacob Faibussowitsch { 24291cbb95d3SBarry Smith PetscFunctionBegin; 24309566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24321cbb95d3SBarry Smith } 24331cbb95d3SBarry Smith 2434d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2435d71ae5a4SJacob Faibussowitsch { 2436416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2437fff8e43fSBarry Smith const PetscScalar *l, *r; 2438fff8e43fSBarry Smith 
PetscScalar x; 243954f21887SBarry Smith MatScalar *v; 2440fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2441fff8e43fSBarry Smith const PetscInt *jj; 244217ab2063SBarry Smith 24433a40ed3dSBarry Smith PetscFunctionBegin; 244417ab2063SBarry Smith if (ll) { 24453ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24463ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24479566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244808401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24499566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 245117ab2063SBarry Smith for (i = 0; i < m; i++) { 245217ab2063SBarry Smith x = l[i]; 2453416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24542205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 245517ab2063SBarry Smith } 24569566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24579566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245917ab2063SBarry Smith } 246017ab2063SBarry Smith if (rr) { 24619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 246208401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24639566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24652e5835c6SStefano Zampini jj = a->j; 24662205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24689566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24699566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 247017ab2063SBarry Smith } 24719566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 247317ab2063SBarry Smith } 247417ab2063SBarry Smith 2475d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2476d71ae5a4SJacob Faibussowitsch { 2477db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2478d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247997f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24805d0c19d7SBarry Smith const PetscInt *irow, *icol; 24812e5835c6SStefano Zampini const PetscScalar *aa; 24825d0c19d7SBarry Smith PetscInt nrows, ncols; 248397f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2484fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2485416022c9SBarry Smith Mat C; 2486cdc6f3adSToby Isaac PetscBool stride; 248717ab2063SBarry Smith 24883a40ed3dSBarry Smith PetscFunctionBegin; 24899566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24909566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24919566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 249217ab2063SBarry Smith 24939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2494ff718158SBarry Smith if (stride) { 24959566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2496ff718158SBarry Smith } else { 2497ff718158SBarry Smith first = 0; 2498ff718158SBarry Smith step = 0; 2499ff718158SBarry Smith } 2500fee21e36SBarry Smith if (stride && step == 1) { 250102834360SBarry Smith /* special case of contiguous rows */ 25029566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 250302834360SBarry Smith /* loop over new rows determining lens and starting points */ 
250402834360SBarry Smith for (i = 0; i < nrows; i++) { 2505bfeeae90SHong Zhang kstart = ai[irow[i]]; 2506a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2507a91a9bebSLisandro Dalcin starts[i] = kstart; 250802834360SBarry Smith for (k = kstart; k < kend; k++) { 2509bfeeae90SHong Zhang if (aj[k] >= first) { 251002834360SBarry Smith starts[i] = k; 251102834360SBarry Smith break; 251202834360SBarry Smith } 251302834360SBarry Smith } 2514a2744918SBarry Smith sum = 0; 251502834360SBarry Smith while (k < kend) { 2516bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2517a2744918SBarry Smith sum++; 251802834360SBarry Smith } 2519a2744918SBarry Smith lens[i] = sum; 252002834360SBarry Smith } 252102834360SBarry Smith /* create submatrix */ 2522cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 252397f1f81fSBarry Smith PetscInt n_cols, n_rows; 25249566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2525aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25269566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 252708480c60SBarry Smith C = *B; 25283a40ed3dSBarry Smith } else { 25293bef6203SJed Brown PetscInt rbs, cbs; 25309566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25319566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25329566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25339566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25349566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25359566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 253708480c60SBarry Smith } 2538db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2539db02288aSLois Curfman McInnes 254002834360SBarry 
Smith /* loop over rows inserting into submatrix */ 2541fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2542db02288aSLois Curfman McInnes j_new = c->j; 2543db02288aSLois Curfman McInnes i_new = c->i; 25449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 254502834360SBarry Smith for (i = 0; i < nrows; i++) { 2546a2744918SBarry Smith ii = starts[i]; 2547a2744918SBarry Smith lensi = lens[i]; 2548ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25499566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2550a2744918SBarry Smith a_new += lensi; 2551a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2552a2744918SBarry Smith c->ilen[i] = lensi; 255302834360SBarry Smith } 2554fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25569566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25573a40ed3dSBarry Smith } else { 25589566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25599566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25614dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25626bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25634dcab191SBarry Smith smap[icol[i]] = i + 1; 25644dcab191SBarry Smith } 25654dcab191SBarry Smith 256602834360SBarry Smith /* determine lens of each row */ 256702834360SBarry Smith for (i = 0; i < nrows; i++) { 2568bfeeae90SHong Zhang kstart = ai[irow[i]]; 256902834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 
257002834360SBarry Smith lens[i] = 0; 257102834360SBarry Smith for (k = kstart; k < kend; k++) { 2572ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 257302834360SBarry Smith } 257402834360SBarry Smith } 257517ab2063SBarry Smith /* Create and fill new matrix */ 2576a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2577ace3abfcSBarry Smith PetscBool equal; 25780f5bd95cSBarry Smith 257999141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2580aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25819566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2582*fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros"); 25839566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 258408480c60SBarry Smith C = *B; 25853a40ed3dSBarry Smith } else { 25863bef6203SJed Brown PetscInt rbs, cbs; 25879566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25889566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25899566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25909566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25919566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25929566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 259408480c60SBarry Smith } 25959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2596fb3c7e2dSJunchao Zhang 259799141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 2598fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 259917ab2063SBarry Smith for (i = 0; i < 
nrows; i++) { 260099141d43SSatish Balay row = irow[i]; 2601bfeeae90SHong Zhang kstart = ai[row]; 260299141d43SSatish Balay kend = kstart + a->ilen[row]; 2603bfeeae90SHong Zhang mat_i = c->i[i]; 260499141d43SSatish Balay mat_j = c->j + mat_i; 2605fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 260699141d43SSatish Balay mat_ilen = c->ilen + i; 260717ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2608bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2609ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26102e5835c6SStefano Zampini *mat_a++ = aa[k]; 261199141d43SSatish Balay (*mat_ilen)++; 261217ab2063SBarry Smith } 261317ab2063SBarry Smith } 261417ab2063SBarry Smith } 26159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 261602834360SBarry Smith /* Free work space */ 26179566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26189566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26199566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2620cdc6f3adSToby Isaac /* sort */ 2621cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2622cdc6f3adSToby Isaac PetscInt ilen; 2623cdc6f3adSToby Isaac 2624cdc6f3adSToby Isaac mat_i = c->i[i]; 2625cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2626fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 2627cdc6f3adSToby Isaac ilen = c->ilen[i]; 26289566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2629cdc6f3adSToby Isaac } 2630fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 263102834360SBarry Smith } 26328c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26339566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2634305c6ccfSStefano Zampini #endif 26359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 263717ab2063SBarry Smith 26389566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 
2639416022c9SBarry Smith *B = C; 26403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 264117ab2063SBarry Smith } 264217ab2063SBarry Smith 2643ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2644d71ae5a4SJacob Faibussowitsch { 264582d44351SHong Zhang Mat B; 264682d44351SHong Zhang 264782d44351SHong Zhang PetscFunctionBegin; 2648c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26499566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26509566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26519566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26529566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26539566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 265482d44351SHong Zhang *subMat = B; 2655c2d650bdSHong Zhang } else { 26569566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2657c2d650bdSHong Zhang } 26583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265982d44351SHong Zhang } 266082d44351SHong Zhang 2661ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2662d71ae5a4SJacob Faibussowitsch { 266363b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 266463b91edcSBarry Smith Mat outA; 2665ace3abfcSBarry Smith PetscBool row_identity, col_identity; 266663b91edcSBarry Smith 26673a40ed3dSBarry Smith PetscFunctionBegin; 266808401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26691df811f5SHong Zhang 26709566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26719566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2672a871dcd8SBarry Smith 
267363b91edcSBarry Smith outA = inA; 2674d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26759566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26769566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26772205254eSKarl Rupp 26789566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26799566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26802205254eSKarl Rupp 2681c3122656SLisandro Dalcin a->row = row; 26822205254eSKarl Rupp 26839566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26852205254eSKarl Rupp 2686c3122656SLisandro Dalcin a->col = col; 268763b91edcSBarry Smith 268836db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26899566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26909566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2691f0ec6fceSSatish Balay 269294a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 269494a9d846SBarry Smith } 269563b91edcSBarry Smith 26969566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2697137fb511SHong Zhang if (row_identity && col_identity) { 26989566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2699137fb511SHong Zhang } else { 27009566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2701137fb511SHong Zhang } 27023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2703a871dcd8SBarry Smith } 2704a871dcd8SBarry Smith 2705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2706d71ae5a4SJacob Faibussowitsch { 2707f0b747eeSBarry Smith Mat_SeqAIJ *a = 
(Mat_SeqAIJ *)inA->data; 2708dfa0f9e5SStefano Zampini PetscScalar *v; 2709c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27103a40ed3dSBarry Smith 27113a40ed3dSBarry Smith PetscFunctionBegin; 27129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27139566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2714792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27159566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2719f0b747eeSBarry Smith } 2720f0b747eeSBarry Smith 2721d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2722d71ae5a4SJacob Faibussowitsch { 272316b64355SHong Zhang PetscInt i; 272416b64355SHong Zhang 272516b64355SHong Zhang PetscFunctionBegin; 272616b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27279566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 272816b64355SHong Zhang 272948a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27309566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 273116b64355SHong Zhang 273216b64355SHong Zhang if (submatj->rbuf1) { 27339566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 273516b64355SHong Zhang } 273616b64355SHong Zhang 273748a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27389566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27399566063dSJacob Faibussowitsch 
PetscCall(PetscFree(submatj->pa)); 274016b64355SHong Zhang } 274116b64355SHong Zhang 274216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2743eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27449566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27459566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 274616b64355SHong Zhang #else 27479566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 274816b64355SHong Zhang #endif 274916b64355SHong Zhang 275016b64355SHong Zhang if (!submatj->allcolumns) { 275116b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2752eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 275316b64355SHong Zhang #else 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 275516b64355SHong Zhang #endif 275616b64355SHong Zhang } 27579566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 275816b64355SHong Zhang 27599566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276116b64355SHong Zhang } 276216b64355SHong Zhang 2763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2764d71ae5a4SJacob Faibussowitsch { 276516b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27665c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 276716b64355SHong Zhang 276816b64355SHong Zhang PetscFunctionBegin; 27699566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27709566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 277216b64355SHong Zhang } 277316b64355SHong Zhang 277489a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2775ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2776d71ae5a4SJacob 
Faibussowitsch { 27772d033e1fSHong Zhang PetscInt i; 27780fb991dcSHong Zhang Mat C; 27790fb991dcSHong Zhang Mat_SeqAIJ *c; 27800fb991dcSHong Zhang Mat_SubSppt *submatj; 27812d033e1fSHong Zhang 27822d033e1fSHong Zhang PetscFunctionBegin; 27832d033e1fSHong Zhang for (i = 0; i < n; i++) { 27840fb991dcSHong Zhang C = (*mat)[i]; 27850fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27860fb991dcSHong Zhang submatj = c->submatis1; 27872d033e1fSHong Zhang if (submatj) { 2788682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278926cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27909566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27919566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27929566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27933faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27949566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27959566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27969566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2797682e4c99SStefano Zampini } 27982d033e1fSHong Zhang } else { 27999566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28002d033e1fSHong Zhang } 28012d033e1fSHong Zhang } 280286e85357SHong Zhang 280363a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28049566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 280563a75b2aSHong Zhang 28069566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28082d033e1fSHong Zhang } 28092d033e1fSHong Zhang 2810ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2811d71ae5a4SJacob Faibussowitsch { 281297f1f81fSBarry Smith PetscInt i; 2813cddf8d76SBarry Smith 28143a40ed3dSBarry Smith PetscFunctionBegin; 
281548a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2816cddf8d76SBarry Smith 281748a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2819cddf8d76SBarry Smith } 2820cddf8d76SBarry Smith 2821ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2822d71ae5a4SJacob Faibussowitsch { 2823e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28249a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28255d0c19d7SBarry Smith const PetscInt *idx; 28269a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2827f1af5d2fSBarry Smith PetscBT table; 2828bbd702dbSSatish Balay 28293a40ed3dSBarry Smith PetscFunctionBegin; 28309a88ca10SBarry Smith m = A->rmap->n / bs; 2831e4d965acSSatish Balay ai = a->i; 2832bfeeae90SHong Zhang aj = a->j; 28338a047759SSatish Balay 283408401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 283506763907SSatish Balay 28369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28379566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 283806763907SSatish Balay 2839e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2840b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2841e4d965acSSatish Balay isz = 0; 28429566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2843e4d965acSSatish Balay 2844e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28459566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28469566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2847e4d965acSSatish Balay 28489a88ca10SBarry Smith if 
(bs > 1) { 28499a88ca10SBarry Smith /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 28509a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28519a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28529a88ca10SBarry Smith } 28539a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28549a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28559a88ca10SBarry Smith 28569a88ca10SBarry Smith k = 0; 28579a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28589a88ca10SBarry Smith n = isz; 28599a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28609a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28619a88ca10SBarry Smith row = bs * nidx[k] + ll; 28629a88ca10SBarry Smith start = ai[row]; 28639a88ca10SBarry Smith end = ai[row + 1]; 28649a88ca10SBarry Smith for (l = start; l < end; l++) { 28659a88ca10SBarry Smith val = aj[l] / bs; 28669a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28679a88ca10SBarry Smith } 28689a88ca10SBarry Smith } 28699a88ca10SBarry Smith } 28709a88ca10SBarry Smith } 28719a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28729a88ca10SBarry Smith } else { 2873dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2874e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28752205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28764dcbc457SBarry Smith } 28779566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28789566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2879e4d965acSSatish Balay 288004a348a9SBarry Smith k = 0; 288104a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 288204a348a9SBarry Smith n = isz; 288306763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2884e4d965acSSatish Balay row = nidx[k]; 2885e4d965acSSatish Balay start = ai[row]; 2886e4d965acSSatish Balay end = ai[row + 1]; 288704a348a9SBarry Smith for (l = start; l < end; l++) { 2888efb16452SHong Zhang val = aj[l]; 28892205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2890e4d965acSSatish Balay } 2891e4d965acSSatish Balay } 2892e4d965acSSatish Balay } 28939566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2894e4d965acSSatish Balay } 28959a88ca10SBarry Smith } 28969566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28979566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28994dcbc457SBarry Smith } 290017ab2063SBarry Smith 2901ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2902d71ae5a4SJacob Faibussowitsch { 29030513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29043b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29055d0c19d7SBarry Smith const PetscInt *row, *col; 29065d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 290756cd22aeSBarry Smith IS icolp, irowp; 29080298fd71SBarry Smith PetscInt *cwork = NULL; 29090298fd71SBarry Smith PetscScalar *vwork = NULL; 29100513a670SBarry Smith 
29113a40ed3dSBarry Smith PetscFunctionBegin; 29129566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29139566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29149566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29159566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29160513a670SBarry Smith 29170513a670SBarry Smith /* determine lengths of permuted rows */ 29189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29192205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29209566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29219566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29229566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29239566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29259566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29260513a670SBarry Smith 29279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29280513a670SBarry Smith for (i = 0; i < m; i++) { 29299566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29302205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29319566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29329566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29330513a670SBarry Smith } 29349566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29352205254eSKarl Rupp 29363c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29372205254eSKarl Rupp 29388c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29399566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29409fe5e383SStefano Zampini #endif 
29419566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29429566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29439566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29449566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29459566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29469566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 294748a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29490513a670SBarry Smith } 29500513a670SBarry Smith 2951d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2952d71ae5a4SJacob Faibussowitsch { 2953cb5b572fSBarry Smith PetscFunctionBegin; 295433f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 295533f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2956be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2957be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29582e5835c6SStefano Zampini const PetscScalar *aa; 2959be6bf707SBarry Smith 29609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 296108401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29639566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2965cb5b572fSBarry Smith } else { 29669566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2967cb5b572fSBarry Smith } 29683ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2969cb5b572fSBarry Smith } 2970cb5b572fSBarry Smith 2971d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2972d71ae5a4SJacob Faibussowitsch { 29736c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29746e111a19SKarl Rupp 29756c0721eeSBarry Smith PetscFunctionBegin; 29766c0721eeSBarry Smith *array = a->a; 29773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29786c0721eeSBarry Smith } 29796c0721eeSBarry Smith 2980d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2981d71ae5a4SJacob Faibussowitsch { 29826c0721eeSBarry Smith PetscFunctionBegin; 2983f38c1e66SStefano Zampini *array = NULL; 29843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29856c0721eeSBarry Smith } 2986273d9f13SBarry Smith 29878229c054SShri Abhyankar /* 29888229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29898229c054SShri Abhyankar have different nonzero structure. 
29908229c054SShri Abhyankar */ 2991d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2992d71ae5a4SJacob Faibussowitsch { 2993b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2994ec7775f6SShri Abhyankar 2995ec7775f6SShri Abhyankar PetscFunctionBegin; 2996ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2997ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 2998b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 2999b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3000b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30018af7cee1SJed Brown nnz[i] = 0; 30028af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3003b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3004b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30058af7cee1SJed Brown nnz[i]++; 30068af7cee1SJed Brown } 30078af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3008ec7775f6SShri Abhyankar } 30093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3010ec7775f6SShri Abhyankar } 3011ec7775f6SShri Abhyankar 3012d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3013d71ae5a4SJacob Faibussowitsch { 3014b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3015b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3016b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3017b264fe52SHong Zhang 3018b264fe52SHong Zhang PetscFunctionBegin; 3019b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30209566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3022b264fe52SHong Zhang } 3023b264fe52SHong Zhang 3024d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3025d71ae5a4SJacob Faibussowitsch { 3026ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3027ac90fabeSBarry Smith 3028ac90fabeSBarry Smith PetscFunctionBegin; 3029134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3030134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3031134adf20SPierre Jolivet if (e) { 30329566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 303381fa06acSBarry Smith if (e) { 30349566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3035134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303681fa06acSBarry Smith } 303781fa06acSBarry Smith } 303854c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303981fa06acSBarry Smith } 3040ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30412e5835c6SStefano Zampini const PetscScalar *xa; 30422e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 304381fa06acSBarry Smith PetscBLASInt one = 1, bnz; 304481fa06acSBarry Smith 30459566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3048792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30519566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30539566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 
3054ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30559566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3056ac90fabeSBarry Smith } else { 30578229c054SShri Abhyankar Mat B; 30588229c054SShri Abhyankar PetscInt *nnz; 30599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30609566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30619566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30629566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30639566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30649566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30669566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30679566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30689bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30699566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3070ac90fabeSBarry Smith } 30713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3072ac90fabeSBarry Smith } 3073ac90fabeSBarry Smith 3074d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3075d71ae5a4SJacob Faibussowitsch { 3076354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3077354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3078354c94deSBarry Smith PetscInt i, nz; 3079354c94deSBarry Smith PetscScalar *a; 3080354c94deSBarry Smith 3081354c94deSBarry Smith PetscFunctionBegin; 3082354c94deSBarry Smith nz = aij->nz; 30839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30842205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, 
&a)); 3086354c94deSBarry Smith #else 3087354c94deSBarry Smith PetscFunctionBegin; 3088354c94deSBarry Smith #endif 30893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3090354c94deSBarry Smith } 3091354c94deSBarry Smith 3092ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3093d71ae5a4SJacob Faibussowitsch { 3094e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3095d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3096e34fafa9SBarry Smith PetscReal atmp; 3097985db425SBarry Smith PetscScalar *x; 3098ce496241SStefano Zampini const MatScalar *aa, *av; 3099e34fafa9SBarry Smith 3100e34fafa9SBarry Smith PetscFunctionBegin; 310128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3103ce496241SStefano Zampini aa = av; 3104e34fafa9SBarry Smith ai = a->i; 3105e34fafa9SBarry Smith aj = a->j; 3106e34fafa9SBarry Smith 31079566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31089566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31099566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3111e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31129371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31139371c9d4SSatish Balay ai++; 3114e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3115985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31169371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31179371c9d4SSatish Balay x[i] = atmp; 31189371c9d4SSatish Balay if (idx) idx[i] = *aj; 31199371c9d4SSatish Balay } 31209371c9d4SSatish Balay aa++; 31219371c9d4SSatish Balay aj++; 3122985db425SBarry Smith } 3123985db425SBarry Smith } 31249566063dSJacob Faibussowitsch 
PetscCall(VecRestoreArrayWrite(v, &x)); 31259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3127985db425SBarry Smith } 3128985db425SBarry Smith 3129ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3130d71ae5a4SJacob Faibussowitsch { 3131985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3132d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3133985db425SBarry Smith PetscScalar *x; 3134ce496241SStefano Zampini const MatScalar *aa, *av; 3135985db425SBarry Smith 3136985db425SBarry Smith PetscFunctionBegin; 313728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3139ce496241SStefano Zampini aa = av; 3140985db425SBarry Smith ai = a->i; 3141985db425SBarry Smith aj = a->j; 3142985db425SBarry Smith 31439566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31449566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31459566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 314608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3147985db425SBarry Smith for (i = 0; i < m; i++) { 31489371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31499371c9d4SSatish Balay ai++; 3150d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31519371c9d4SSatish Balay x[i] = *aa; 31529371c9d4SSatish Balay if (idx) idx[i] = 0; 3153985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3154985db425SBarry Smith x[i] = 0.0; 3155985db425SBarry Smith if (idx) { 3156985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3157985db425SBarry Smith if (aj[j] > j) { 3158985db425SBarry Smith idx[i] = j; 
3159985db425SBarry Smith break; 3160985db425SBarry Smith } 3161985db425SBarry Smith } 31621a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31631a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3164985db425SBarry Smith } 3165985db425SBarry Smith } 3166985db425SBarry Smith for (j = 0; j < ncols; j++) { 31679371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31689371c9d4SSatish Balay x[i] = *aa; 31699371c9d4SSatish Balay if (idx) idx[i] = *aj; 31709371c9d4SSatish Balay } 31719371c9d4SSatish Balay aa++; 31729371c9d4SSatish Balay aj++; 3173985db425SBarry Smith } 3174985db425SBarry Smith } 31759566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3178985db425SBarry Smith } 3179985db425SBarry Smith 3180ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3181d71ae5a4SJacob Faibussowitsch { 3182c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3183c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3184ce496241SStefano Zampini PetscScalar *x; 3185ce496241SStefano Zampini const MatScalar *aa, *av; 3186c87e5d42SMatthew Knepley 3187c87e5d42SMatthew Knepley PetscFunctionBegin; 31889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3189ce496241SStefano Zampini aa = av; 3190c87e5d42SMatthew Knepley ai = a->i; 3191c87e5d42SMatthew Knepley aj = a->j; 3192c87e5d42SMatthew Knepley 31939566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31949566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31959566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 319608401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3197c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31989371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31999371c9d4SSatish Balay ai++; 3200f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32019371c9d4SSatish Balay x[i] = *aa; 32029371c9d4SSatish Balay if (idx) idx[i] = 0; 3203f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3204f07e67edSHong Zhang x[i] = 0.0; 3205f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3206289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3207f07e67edSHong Zhang if (aj[j] > j) { 3208f07e67edSHong Zhang idx[i] = j; 32092205254eSKarl Rupp break; 32102205254eSKarl Rupp } 3211289a08f5SMatthew Knepley } 3212f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3213f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3214f07e67edSHong Zhang } 3215289a08f5SMatthew Knepley } 3216c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32179371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32189371c9d4SSatish Balay x[i] = *aa; 32199371c9d4SSatish Balay if (idx) idx[i] = *aj; 32209371c9d4SSatish Balay } 32219371c9d4SSatish Balay aa++; 32229371c9d4SSatish Balay aj++; 3223c87e5d42SMatthew Knepley } 3224c87e5d42SMatthew Knepley } 32259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3228c87e5d42SMatthew Knepley } 3229c87e5d42SMatthew Knepley 3230ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3231d71ae5a4SJacob Faibussowitsch { 3232985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3233d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3234d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3235985db425SBarry Smith PetscScalar *x; 
3236ce496241SStefano Zampini const MatScalar *aa, *av; 3237985db425SBarry Smith 3238985db425SBarry Smith PetscFunctionBegin; 323928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3241ce496241SStefano Zampini aa = av; 3242985db425SBarry Smith ai = a->i; 3243985db425SBarry Smith aj = a->j; 3244985db425SBarry Smith 32459566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32469566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32479566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 324808401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3249985db425SBarry Smith for (i = 0; i < m; i++) { 32509371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32519371c9d4SSatish Balay ai++; 3252d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32539371c9d4SSatish Balay x[i] = *aa; 32549371c9d4SSatish Balay if (idx) idx[i] = 0; 3255985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3256985db425SBarry Smith x[i] = 0.0; 3257985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3258985db425SBarry Smith for (j = 0; j < ncols; j++) { 3259985db425SBarry Smith if (aj[j] > j) { 3260985db425SBarry Smith idx[i] = j; 3261985db425SBarry Smith break; 3262985db425SBarry Smith } 3263985db425SBarry Smith } 3264fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3265fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3266985db425SBarry Smith } 3267985db425SBarry Smith } 3268985db425SBarry Smith for (j = 0; j < ncols; j++) { 32699371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32709371c9d4SSatish Balay x[i] = *aa; 32719371c9d4SSatish Balay if (idx) idx[i] = *aj; 32729371c9d4SSatish Balay } 32739371c9d4SSatish Balay aa++; 
32749371c9d4SSatish Balay aj++; 3275e34fafa9SBarry Smith } 3276e34fafa9SBarry Smith } 32779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3280e34fafa9SBarry Smith } 3281bbead8a2SBarry Smith 3282ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3283d71ae5a4SJacob Faibussowitsch { 3284bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 328533d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3286bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32870da83c2eSBarry Smith const PetscReal shift = 0.0; 32881a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3289bbead8a2SBarry Smith 3290bbead8a2SBarry Smith PetscFunctionBegin; 3291a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32924a0d0026SBarry Smith if (a->ibdiagvalid) { 32934a0d0026SBarry Smith if (values) *values = a->ibdiag; 32943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 32954a0d0026SBarry Smith } 32969566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 32974dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3298bbead8a2SBarry Smith diag = a->ibdiag; 3299bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3300bbead8a2SBarry Smith /* factor and invert each block */ 3301bbead8a2SBarry Smith switch (bs) { 3302bbead8a2SBarry Smith case 1: 3303bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33049566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3305ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3306ec1892c8SHong Zhang if (allowzeropivot) { 33077b6c816cSBarry Smith A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 33087b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33097b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33109566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 331198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3312ec1892c8SHong Zhang } 3313bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3314bbead8a2SBarry Smith } 3315bbead8a2SBarry Smith break; 3316bbead8a2SBarry Smith case 2: 3317bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33189371c9d4SSatish Balay ij[0] = 2 * i; 33199371c9d4SSatish Balay ij[1] = 2 * i + 1; 33209566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33219566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33227b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33239566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3324bbead8a2SBarry Smith diag += 4; 3325bbead8a2SBarry Smith } 3326bbead8a2SBarry Smith break; 3327bbead8a2SBarry Smith case 3: 3328bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33299371c9d4SSatish Balay ij[0] = 3 * i; 33309371c9d4SSatish Balay ij[1] = 3 * i + 1; 33319371c9d4SSatish Balay ij[2] = 3 * i + 2; 33329566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33339566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33347b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33359566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3336bbead8a2SBarry Smith diag += 9; 3337bbead8a2SBarry Smith } 3338bbead8a2SBarry Smith break; 3339bbead8a2SBarry Smith case 4: 3340bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33419371c9d4SSatish Balay ij[0] = 4 * i; 33429371c9d4SSatish Balay ij[1] = 4 * i + 1; 33439371c9d4SSatish Balay ij[2] = 4 * i + 2; 33449371c9d4SSatish Balay ij[3] = 4 * i + 3; 33459566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33477b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3349bbead8a2SBarry Smith diag += 16; 3350bbead8a2SBarry Smith } 3351bbead8a2SBarry Smith break; 3352bbead8a2SBarry Smith case 5: 3353bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33549371c9d4SSatish Balay ij[0] = 5 * i; 33559371c9d4SSatish Balay ij[1] = 5 * i + 1; 33569371c9d4SSatish Balay ij[2] = 5 * i + 2; 33579371c9d4SSatish Balay ij[3] = 5 * i + 3; 33589371c9d4SSatish Balay ij[4] = 5 * i + 4; 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3363bbead8a2SBarry Smith diag += 25; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith case 6: 3367bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33689371c9d4SSatish Balay ij[0] = 6 * i; 33699371c9d4SSatish Balay ij[1] = 6 * i + 1; 33709371c9d4SSatish Balay ij[2] = 6 * i + 2; 33719371c9d4SSatish Balay ij[3] = 6 * i + 3; 33729371c9d4SSatish Balay ij[4] = 
6 * i + 4; 33739371c9d4SSatish Balay ij[5] = 6 * i + 5; 33749566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33759566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33767b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33779566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3378bbead8a2SBarry Smith diag += 36; 3379bbead8a2SBarry Smith } 3380bbead8a2SBarry Smith break; 3381bbead8a2SBarry Smith case 7: 3382bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33839371c9d4SSatish Balay ij[0] = 7 * i; 33849371c9d4SSatish Balay ij[1] = 7 * i + 1; 33859371c9d4SSatish Balay ij[2] = 7 * i + 2; 33869371c9d4SSatish Balay ij[3] = 7 * i + 3; 33879371c9d4SSatish Balay ij[4] = 7 * i + 4; 33889371c9d4SSatish Balay ij[5] = 7 * i + 5; 3389cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 33909566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33919566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33927b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33939566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3394bbead8a2SBarry Smith diag += 49; 3395bbead8a2SBarry Smith } 3396bbead8a2SBarry Smith break; 3397bbead8a2SBarry Smith default: 33989566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3399bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3400ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34019566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34029566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34037b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34049566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3405bbead8a2SBarry Smith diag += bs2; 3406bbead8a2SBarry Smith } 34079566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3408bbead8a2SBarry Smith } 3409bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3411bbead8a2SBarry Smith } 3412bbead8a2SBarry Smith 3413d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3414d71ae5a4SJacob Faibussowitsch { 341573a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3416fff043a9SJunchao Zhang PetscScalar a, *aa; 341773a71a0fSBarry Smith PetscInt m, n, i, j, col; 341873a71a0fSBarry Smith 341973a71a0fSBarry Smith PetscFunctionBegin; 342073a71a0fSBarry Smith if (!x->assembled) { 34219566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 342273a71a0fSBarry Smith for (i = 0; i < m; i++) { 342373a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34249566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 342573a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34269566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 342773a71a0fSBarry Smith } 342873a71a0fSBarry Smith } 3429e2ce353bSJunchao Zhang } else { 34309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34319566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3433e2ce353bSJunchao Zhang } 34349566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34359566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 343773a71a0fSBarry Smith } 343873a71a0fSBarry Smith 3439679944adSJunchao 
/*
  Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high)

  For every row i, aij->imax[i] values are drawn from rctx. The column is picked from the shrunken range
  of n - (high - low) columns and, when it lands at or beyond low, shifted right by (high - low) so that
  it falls outside the hole. Values are inserted with ADD_VALUES and the matrix is assembled at the end.
  Unlike MatSetRandom_SeqAIJ, this routine does not look at x->assembled.
*/
PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
  PetscScalar a;
  PetscInt    m, n, i, j, col, nskip;

  PetscFunctionBegin;
  nskip = high - low;
  PetscCall(MatGetSize(x, &m, &n));
  n -= nskip; /* shrink number of columns where nonzeros can be set */
  for (i = 0; i < m; i++) {
    for (j = 0; j < aij->imax[i]; j++) {
      PetscCall(PetscRandomGetValue(rctx, &a));
      col = (PetscInt)(n * PetscRealPart(a));
      if (col >= low) col += nskip; /* shift col rightward to skip the hole */
      PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
    }
  }
  PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
  PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  Function table for the SeqAIJ implementation. The initializer is positional: each entry fills the
  next member of struct _MatOps (declared elsewhere), and NULL marks an operation that has no
  implementation in this table. The numeric markers give the zero-based slot index of the entry they
  precede; keep them in sync when inserting or removing entries.
*/
static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
                                       MatGetRow_SeqAIJ,
                                       MatRestoreRow_SeqAIJ,
                                       MatMult_SeqAIJ,
                                       /*  4*/ MatMultAdd_SeqAIJ,
                                       MatMultTranspose_SeqAIJ,
                                       MatMultTransposeAdd_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 10*/ NULL,
                                       MatLUFactor_SeqAIJ,
                                       NULL,
                                       MatSOR_SeqAIJ,
                                       MatTranspose_SeqAIJ,
                                       /* 15*/ MatGetInfo_SeqAIJ,
                                       MatEqual_SeqAIJ,
                                       MatGetDiagonal_SeqAIJ,
                                       MatDiagonalScale_SeqAIJ,
                                       MatNorm_SeqAIJ,
                                       /* 20*/ NULL,
                                       MatAssemblyEnd_SeqAIJ,
                                       MatSetOption_SeqAIJ,
                                       MatZeroEntries_SeqAIJ,
                                       /* 24*/ MatZeroRows_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 29*/ MatSetUp_Seq_Hash,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 34*/ MatDuplicate_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatILUFactor_SeqAIJ,
                                       NULL,
                                       /* 39*/ MatAXPY_SeqAIJ,
                                       MatCreateSubMatrices_SeqAIJ,
                                       MatIncreaseOverlap_SeqAIJ,
                                       MatGetValues_SeqAIJ,
                                       MatCopy_SeqAIJ,
                                       /* 44*/ MatGetRowMax_SeqAIJ,
                                       MatScale_SeqAIJ,
                                       MatShift_SeqAIJ,
                                       MatDiagonalSet_SeqAIJ,
                                       MatZeroRowsColumns_SeqAIJ,
                                       /* 49*/ MatSetRandom_SeqAIJ,
                                       MatGetRowIJ_SeqAIJ,
                                       MatRestoreRowIJ_SeqAIJ,
                                       MatGetColumnIJ_SeqAIJ,
                                       MatRestoreColumnIJ_SeqAIJ,
                                       /* 54*/ MatFDColoringCreate_SeqXAIJ,
                                       NULL,
                                       NULL,
                                       MatPermute_SeqAIJ,
                                       NULL,
                                       /* 59*/ NULL,
                                       MatDestroy_SeqAIJ,
                                       MatView_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 64*/ NULL,
                                       MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 69*/ MatGetRowMaxAbs_SeqAIJ,
                                       MatGetRowMinAbs_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 74*/ NULL,
                                       MatFDColoringApply_AIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 79*/ MatFindZeroDiagonals_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatLoad_SeqAIJ,
                                       /* 84*/ MatIsSymmetric_SeqAIJ,
                                       MatIsHermitian_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 89*/ NULL,
                                       NULL,
                                       MatMatMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
                                       NULL,
                                       NULL,
                                       MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       /* 99*/ MatProductSetFromOptions_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatConjugate_SeqAIJ,
                                       NULL,
                                       /*104*/ MatSetValuesRow_SeqAIJ,
                                       MatRealPart_SeqAIJ,
                                       MatImaginaryPart_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /*109*/ MatMatSolve_SeqAIJ,
                                       NULL,
                                       MatGetRowMin_SeqAIJ,
                                       NULL,
                                       MatMissingDiagonal_SeqAIJ,
                                       /*114*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /*119*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatGetMultiProcBlock_SeqAIJ,
                                       /*124*/ MatFindNonzeroRows_SeqAIJ,
                                       MatGetColumnReductions_SeqAIJ,
                                       MatInvertBlockDiagonal_SeqAIJ,
                                       MatInvertVariableBlockDiagonal_SeqAIJ,
                                       NULL,
                                       /*129*/ NULL,
                                       NULL,
                                       NULL,
                                       MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
                                       MatTransposeColoringCreate_SeqAIJ,
                                       /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
                                       MatTransColoringApplyDenToSp_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatRARtNumeric_SeqAIJ_SeqAIJ,
                                       /*139*/ NULL,
                                       NULL,
                                       NULL,
                                       MatFDColoringSetUp_SeqXAIJ,
                                       MatFindOffBlockDiagonalEntries_SeqAIJ,
                                       MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
                                       /*145*/ MatDestroySubMatrices_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatCreateGraph_Simple_AIJ,
                                       NULL,
                                       /*150*/ MatTransposeSymbolic_SeqAIJ,
                                       MatEliminateZeros_SeqAIJ};

/*
  MatSeqAIJSetColumnIndices_SeqAIJ - Installs a caller-supplied column index array.

  Copies aij->maxnz entries from indices into aij->j, sets aij->nz to aij->maxnz, and marks every one
  of the mat->rmap->n rows as full by setting aij->ilen[i] = aij->imax[i]. The indices array is only
  read; no validation of its contents is done here.
*/
static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  PetscInt    i, nz, n;

  PetscFunctionBegin;
  nz = aij->maxnz;
  n  = mat->rmap->n;
  for (i = 0; i < nz; i++) aij->j[i] = indices[i];
  aij->nz = nz;
  for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
  PetscFunctionReturn(PETSC_SUCCESS);
}
3632ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3633ddea5d60SJunchao Zhang */ 3634d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3635d71ae5a4SJacob Faibussowitsch { 3636a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3637eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3638eec179cfSJacob Faibussowitsch PetscHashIter tpos; 363925b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 364025b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3641a3bb6f32SFande Kong 3642a3bb6f32SFande Kong PetscFunctionBegin; 3643a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36444f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3645a3bb6f32SFande Kong /* use a table */ 3646eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3647a3bb6f32SFande Kong ec = 0; 364825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 364925b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3650eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3651a3bb6f32SFande Kong if (!data) { 3652a3bb6f32SFande Kong /* one based table */ 3653c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3654a3bb6f32SFande Kong } 3655a3bb6f32SFande Kong } 3656a3bb6f32SFande Kong /* form array of columns we need */ 36579566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3658eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3659eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3660eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3661eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3662eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3663a3bb6f32SFande Kong gid--; 3664a3bb6f32SFande 
Kong lid--; 3665a3bb6f32SFande Kong garray[lid] = gid; 3666a3bb6f32SFande Kong } 36679566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3668eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3669c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3670a3bb6f32SFande Kong /* compact out the extra columns in B */ 367125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 367225b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3673eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3674a3bb6f32SFande Kong lid--; 367525b670f0SStefano Zampini jj[i] = lid; 3676a3bb6f32SFande Kong } 36779566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3678eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36799566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36809566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36819566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3683a3bb6f32SFande Kong } 3684a3bb6f32SFande Kong 3685bef8e0ddSBarry Smith /*@ 3686bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3687bef8e0ddSBarry Smith in the matrix. 
3688bef8e0ddSBarry Smith 3689bef8e0ddSBarry Smith Input Parameters: 369011a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3691bef8e0ddSBarry Smith - indices - the column indices 3692bef8e0ddSBarry Smith 369315091d37SBarry Smith Level: advanced 369415091d37SBarry Smith 3695bef8e0ddSBarry Smith Notes: 3696bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3697bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 369811a5261eSBarry Smith of the `MatSetValues()` operation. 3699bef8e0ddSBarry Smith 3700bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 370111a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3702bef8e0ddSBarry Smith 370311a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3704bef8e0ddSBarry Smith 3705b9617806SBarry Smith The indices should start with zero, not one. 3706b9617806SBarry Smith 37071cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3708bef8e0ddSBarry Smith @*/ 3709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3710d71ae5a4SJacob Faibussowitsch { 3711bef8e0ddSBarry Smith PetscFunctionBegin; 37120700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37134f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3714cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3716bef8e0ddSBarry Smith } 3717bef8e0ddSBarry Smith 3718ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3719d71ae5a4SJacob Faibussowitsch { 3720be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3721d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3722be6bf707SBarry Smith 3723be6bf707SBarry Smith PetscFunctionBegin; 372428b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3725be6bf707SBarry Smith 3726be6bf707SBarry Smith /* allocate space for values if not already there */ 37274dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3728be6bf707SBarry Smith 3729be6bf707SBarry Smith /* copy values over */ 37309566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3732be6bf707SBarry Smith } 3733be6bf707SBarry Smith 3734be6bf707SBarry Smith /*@ 373520f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3736be6bf707SBarry Smith nonlinear portion. 3737be6bf707SBarry Smith 3738c3339decSBarry Smith Logically Collect 3739be6bf707SBarry Smith 374027430b45SBarry Smith Input Parameter: 374111a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3742be6bf707SBarry Smith 374315091d37SBarry Smith Level: advanced 374415091d37SBarry Smith 37452920cce0SJacob Faibussowitsch Example Usage: 374627430b45SBarry Smith .vb 37472ef1f0ffSBarry Smith Using SNES 374827430b45SBarry Smith Create Jacobian matrix 374927430b45SBarry Smith Set linear terms into matrix 375027430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 375127430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 375227430b45SBarry Smith boundary conditions again will not change the nonzero structure 375327430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 375427430b45SBarry Smith MatStoreValues(mat); 375527430b45SBarry Smith Call SNESSetJacobian() with matrix 375627430b45SBarry Smith In your Jacobian routine 375727430b45SBarry Smith MatRetrieveValues(mat); 375827430b45SBarry Smith Set nonlinear terms in matrix 3759be6bf707SBarry Smith 376027430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 376127430b45SBarry Smith // build linear portion of Jacobian 376227430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 376327430b45SBarry Smith MatStoreValues(mat); 376427430b45SBarry Smith loop over nonlinear iterations 376527430b45SBarry Smith MatRetrieveValues(mat); 376627430b45SBarry Smith // call MatSetValues(mat,...) to set nonliner portion of Jacobian 376727430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 376827430b45SBarry Smith Solve linear system with Jacobian 376927430b45SBarry Smith endloop 377027430b45SBarry Smith .ve 3771be6bf707SBarry Smith 3772be6bf707SBarry Smith Notes: 3773da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 377411a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3775be6bf707SBarry Smith calling this routine. 3776be6bf707SBarry Smith 37770c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37780c468ba9SBarry Smith and does not allocated additional space. 
37790c468ba9SBarry Smith 3780fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3781be6bf707SBarry Smith @*/ 3782d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3783d71ae5a4SJacob Faibussowitsch { 3784be6bf707SBarry Smith PetscFunctionBegin; 37850700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 378628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 378728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3788cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 37893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3790be6bf707SBarry Smith } 3791be6bf707SBarry Smith 3792ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3793d71ae5a4SJacob Faibussowitsch { 3794be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3795d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3796be6bf707SBarry Smith 3797be6bf707SBarry Smith PetscFunctionBegin; 379828b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 379928b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3800be6bf707SBarry Smith /* copy values over */ 38019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3803be6bf707SBarry Smith } 3804be6bf707SBarry Smith 3805be6bf707SBarry Smith /*@ 380620f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3807be6bf707SBarry Smith 3808c3339decSBarry Smith Logically Collect 3809be6bf707SBarry Smith 38102fe279fdSBarry Smith 
/*@
  MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`

  Logically Collective

  Input Parameter:
. mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

  Note:
  The matrix must be assembled and must not be a factored matrix; either condition failing raises
  `PETSC_ERR_ARG_WRONGSTATE`.

.seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
@*/
PetscErrorCode MatRetrieveValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* dispatch to the implementation composed on the object under this name */
  PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}
/*@C
  MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
  (the default parallel PETSc format).  For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).

  Collective

  Input Parameters:
+ comm - MPI communicator, set to `PETSC_COMM_SELF`
. m    - number of rows
. n    - number of columns
. nz   - number of nonzeros per row (same for all rows)
- nnz  - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Output Parameter:
. A - the matrix

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  It is recommended to use `MatCreateFromOptions()` instead of this routine

  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  By default, this format uses inodes (identical nodes) when possible, to
  improve numerical efficiency of matrix-vector products and solves. We
  search for consecutive rows with the same nonzero structure, thereby
  reusing matrix information to achieve increased efficiency.

.seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  PetscCall(MatCreate(comm, A));
  /* local and global sizes are both passed as m-by-n */
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* the type was just set to MATSEQAIJ, so the SeqAIJ preallocation routine is called directly */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}
/*@C
  MatSeqAIJSetPreallocation - For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).  By setting these parameters accurately, performance
  during matrix assembly can be increased by more than a factor of 50.

  Collective

  Input Parameters:
+ B   - The matrix
. nz  - number of nonzeros per row (same for all rows)
- nnz - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.  See the users' manual for details.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  You can call `MatGetInfo()` to get information on how effective the preallocation was;
  for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
  You can also run with the option -info and look for messages with the string
  malloc in them to see if additional memory allocation was needed.

  Developer Notes:
  Use `nz` of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
  entries or columns indices

  By default, this format uses inodes (identical nodes) when possible, to
  improve numerical efficiency of matrix-vector products and solves. We
  search for consecutive rows with the same nonzero structure, thereby
  reusing matrix information to achieve increased efficiency.

.seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
          `MatSeqAIJSetTotalPreallocation()`
@*/
PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
  PetscValidType(B, 1);
  /* dispatched by name through PetscTryMethod (the sibling setters in this file use PetscUseMethod) */
  PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}
b->cops; 3950ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3951ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3952ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3953ad79cf63SBarry Smith } 39542576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3955a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3956c461c341SBarry Smith skipallocation = PETSC_TRUE; 3957c461c341SBarry Smith nz = 0; 3958c461c341SBarry Smith } 39599566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39609566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3961899cda47SBarry Smith 3962435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 396308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3964cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3965d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 396608401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 396708401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3968b73539f3SBarry Smith } 3969b73539f3SBarry Smith } 3970b73539f3SBarry Smith 3971273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3972ab93d7beSBarry Smith if (!skipallocation) { 39734dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3974071fcb05SBarry Smith if (!b->ilen) { 3975071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39769566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3977071fcb05SBarry Smith } else { 39789566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39792ee49352SLisandro Dalcin } 3980aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3981273d9f13SBarry Smith if (!nnz) { 3982435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3983c62bd62aSJed Brown else if (nz < 0) nz = 1; 39845d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3985d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3986d0f46423SBarry Smith nz = nz * B->rmap->n; 3987273d9f13SBarry Smith } else { 3988c73702f5SBarry Smith PetscInt64 nz64 = 0; 39899371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39909371c9d4SSatish Balay b->imax[i] = nnz[i]; 39919371c9d4SSatish Balay nz64 += nnz[i]; 39929371c9d4SSatish Balay } 39939566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3994273d9f13SBarry Smith } 3995ab93d7beSBarry Smith 3996273d9f13SBarry Smith /* allocate the matrix space */ 399753dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39989566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 3999396832f4SHong Zhang if (B->structure_only) { 40009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4002396832f4SHong Zhang } else { 40039566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4004396832f4SHong Zhang } 4005bfeeae90SHong Zhang b->i[0] = 0; 4006ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4007396832f4SHong Zhang if (B->structure_only) { 4008396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4009396832f4SHong Zhang b->free_a = PETSC_FALSE; 4010396832f4SHong Zhang } else { 4011273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4012e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4013396832f4SHong Zhang } 4014e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4015c461c341SBarry Smith } else { 4016e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4017e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4018c461c341SBarry Smith } 4019273d9f13SBarry Smith 4020846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4021846b4da1SFande Kong /* reserve user-requested sparsity */ 40229566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4023846b4da1SFande Kong } 4024846b4da1SFande Kong 4025273d9f13SBarry Smith b->nz = 0; 4026273d9f13SBarry Smith b->maxnz = nz; 4027273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40281baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4029cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4030cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40315519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40325519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40335519a089SJose E. Roman */ 40345519a089SJose E. Roman B->nonzerostate++; 40353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4036273d9f13SBarry Smith } 4037273d9f13SBarry Smith 4038ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4039d71ae5a4SJacob Faibussowitsch { 4040846b4da1SFande Kong Mat_SeqAIJ *a; 4041a5bbaf83SFande Kong PetscInt i; 40421f14be2bSBarry Smith PetscBool skipreset; 4043846b4da1SFande Kong 4044846b4da1SFande Kong PetscFunctionBegin; 4045846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 404614d0e64fSAlex Lindsay 404714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40483ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 404914d0e64fSAlex Lindsay 4050846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40512c814fdeSFande Kong /* if no saved info, we error out */ 405228b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40532c814fdeSFande Kong 40541f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40552c814fdeSFande Kong 40561f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40571f14be2bSBarry Smith if (!skipreset) { 40589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40599566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4060846b4da1SFande Kong a->i[0] = 0; 4061ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4062846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4063846b4da1SFande Kong a->nz = 0; 4064846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4065846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4066846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4067846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 40681f14be2bSBarry Smith } 40693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4070846b4da1SFande Kong } 4071846b4da1SFande Kong 407258d36128SBarry Smith /*@ 407311a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4074a1661176SMatthew Knepley 4075a1661176SMatthew Knepley Input Parameters: 4076a1661176SMatthew Knepley + B - the matrix 4077a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4078a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4079a1661176SMatthew Knepley - v - optional values in the matrix 4080a1661176SMatthew Knepley 4081a1661176SMatthew Knepley Level: developer 4082a1661176SMatthew Knepley 40836a9b8d82SBarry Smith Notes: 40842ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 408558d36128SBarry Smith 40866a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40876a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40886a9b8d82SBarry Smith 40896a9b8d82SBarry Smith Developer Notes: 40902ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 40912ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 40926a9b8d82SBarry Smith 409311a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
40946a9b8d82SBarry Smith 4095fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4096a1661176SMatthew Knepley @*/ 4097d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4098d71ae5a4SJacob Faibussowitsch { 4099a1661176SMatthew Knepley PetscFunctionBegin; 41000700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41016ba663aaSJed Brown PetscValidType(B, 1); 4102cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4104a1661176SMatthew Knepley } 4105a1661176SMatthew Knepley 4106ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4107d71ae5a4SJacob Faibussowitsch { 4108a1661176SMatthew Knepley PetscInt i; 4109a1661176SMatthew Knepley PetscInt m, n; 4110a1661176SMatthew Knepley PetscInt nz; 41116a9b8d82SBarry Smith PetscInt *nnz; 4112a1661176SMatthew Knepley 4113a1661176SMatthew Knepley PetscFunctionBegin; 4114aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4115779a8d59SSatish Balay 41169566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41179566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4118779a8d59SSatish Balay 41199566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4121a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4122b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 412308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4124a1661176SMatthew Knepley nnz[i] = nz; 4125a1661176SMatthew Knepley } 41269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41279566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4128a1661176SMatthew Knepley 412948a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4130a1661176SMatthew Knepley 41319566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41329566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4133a1661176SMatthew Knepley 41349566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4136a1661176SMatthew Knepley } 4137a1661176SMatthew Knepley 4138ad7e164aSPierre Jolivet /*@ 41392ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4140ad7e164aSPierre Jolivet 4141ad7e164aSPierre Jolivet Input Parameters: 4142ad7e164aSPierre Jolivet + A - left-hand side matrix 4143ad7e164aSPierre Jolivet . B - right-hand side matrix 414411a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4145ad7e164aSPierre Jolivet 4146ad7e164aSPierre Jolivet Output Parameter: 41472ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4148ad7e164aSPierre Jolivet 4149ad7e164aSPierre Jolivet Level: intermediate 4150ad7e164aSPierre Jolivet 415111a5261eSBarry Smith Note: 415211a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4153ad7e164aSPierre Jolivet 41541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4155ad7e164aSPierre Jolivet @*/ 4156d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4157d71ae5a4SJacob Faibussowitsch { 4158ad7e164aSPierre Jolivet PetscFunctionBegin; 4159ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4160ad7e164aSPierre Jolivet PetscValidType(A, 1); 4161ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4162ad7e164aSPierre Jolivet PetscValidType(B, 2); 41634f572ea9SToby Isaac PetscAssertPointer(C, 4); 4164ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4165ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4166ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4167ad7e164aSPierre Jolivet } 4168cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4170ad7e164aSPierre Jolivet } 4171ad7e164aSPierre Jolivet 4172ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4173d71ae5a4SJacob Faibussowitsch { 4174ad7e164aSPierre Jolivet Mat newmat; 4175ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4176ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4177ad7e164aSPierre Jolivet PetscScalar *v; 4178fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4179ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4180ad7e164aSPierre Jolivet PetscBool flg; 4181ad7e164aSPierre Jolivet 4182ad7e164aSPierre Jolivet PetscFunctionBegin; 418328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418428b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 418528b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418628b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 418828b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4189aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4190ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41919566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41929566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41939566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41949566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4195ad7e164aSPierre Jolivet i[0] = 0; 4196ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4197ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4198ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4199ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4200ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4201ad7e164aSPierre Jolivet } 4202ad7e164aSPierre Jolivet } 4203ad7e164aSPierre Jolivet } 42049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4205ad7e164aSPierre Jolivet *C = newmat; 42069566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4207ad7e164aSPierre Jolivet nnz = 0; 4208ad7e164aSPierre Jolivet } 42099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4212ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4213ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4214ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4215ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4216ad7e164aSPierre Jolivet } 4217ad7e164aSPierre Jolivet } 4218ad7e164aSPierre Jolivet } 42199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4223ad7e164aSPierre Jolivet } 4224ad7e164aSPierre Jolivet 4225c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4226af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4227170fe5c8SBarry Smith 4228170fe5c8SBarry Smith /* 4229170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4230170fe5c8SBarry Smith 4231170fe5c8SBarry Smith n p p 42322da392ccSBarry Smith [ ] [ ] [ ] 42332da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42342da392ccSBarry Smith [ ] [ ] [ ] 4235170fe5c8SBarry Smith 4236170fe5c8SBarry Smith */ 4237d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4238d71ae5a4SJacob Faibussowitsch { 4239170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4240170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4241170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 424286214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4243170fe5c8SBarry Smith const PetscInt *ii, *idx; 4244170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4245170fe5c8SBarry Smith PetscScalar *c, *c_q; 424686214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 424786214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4248170fe5c8SBarry Smith 4249170fe5c8SBarry Smith PetscFunctionBegin; 4250d0f46423SBarry Smith m = A->rmap->n; 4251d0f46423SBarry Smith n = A->cmap->n; 4252d0f46423SBarry Smith p = B->cmap->n; 4253170fe5c8SBarry Smith a = sub_a->v; 4254170fe5c8SBarry Smith b = sub_b->a; 4255170fe5c8SBarry Smith c = sub_c->v; 425686214ceeSStefano Zampini if (clda == m) { 42579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 425886214ceeSStefano Zampini } else { 425986214ceeSStefano Zampini for (j = 0; j < p; j++) 42609371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 426186214ceeSStefano Zampini } 4262170fe5c8SBarry Smith ii = sub_b->i; 4263170fe5c8SBarry Smith idx = sub_b->j; 4264170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4265170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4266170fe5c8SBarry Smith while (q-- > 0) { 426786214ceeSStefano Zampini c_q = c + clda * (*idx); 426886214ceeSStefano Zampini a_q = a + alda * i; 4269854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4270170fe5c8SBarry Smith idx++; 4271170fe5c8SBarry Smith b++; 4272170fe5c8SBarry Smith } 4273170fe5c8SBarry Smith } 42743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4275170fe5c8SBarry Smith } 4276170fe5c8SBarry Smith 4277d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4278d71ae5a4SJacob Faibussowitsch { 4279d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 428086214ceeSStefano Zampini PetscBool cisdense; 4281170fe5c8SBarry Smith 4282170fe5c8SBarry Smith PetscFunctionBegin; 428308401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42849566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42859566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4286d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 428748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42889566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4289d73949e8SHong Zhang 42904222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 42913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4292170fe5c8SBarry Smith } 4293170fe5c8SBarry Smith 42940bad9183SKris Buschelman /*MC 4295fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42960bad9183SKris Buschelman based on compressed sparse row format. 42970bad9183SKris Buschelman 42982ef1f0ffSBarry Smith Options Database Key: 42990bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43000bad9183SKris Buschelman 43010bad9183SKris Buschelman Level: beginner 43020bad9183SKris Buschelman 43030cd7f59aSBarry Smith Notes: 43042ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43050cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43060cd7f59aSBarry Smith in the matrix 43070cd7f59aSBarry Smith 430811a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

  Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
  `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
  for communicators controlling multiple processes.  It is recommended that you call both of
  the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

  Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This type also automatically switches over to use inodes when
   enough exist.
4334ccd284c7SBarry Smith 43351cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4336ccd284c7SBarry Smith M*/ 4337ccd284c7SBarry Smith 4338ccd284c7SBarry Smith /*MC 4339ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4340ccd284c7SBarry Smith 43412ef1f0ffSBarry Smith Options Database Key: 43422ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43432ef1f0ffSBarry Smith 43442ef1f0ffSBarry Smith Level: beginner 43452ef1f0ffSBarry Smith 43462ef1f0ffSBarry Smith Note: 434711a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 434811a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 434911a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4350ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4351ccd284c7SBarry Smith the above preallocation routines for simplicity. 4352ccd284c7SBarry Smith 43531cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4354ccd284c7SBarry Smith M*/ 4355ccd284c7SBarry Smith 43567906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43577906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43587906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43597906f579SHong Zhang #endif 4360d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4361d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4362d24d4204SJose E. 
Roman #endif 43637906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43647906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43657906f579SHong Zhang #endif 43667906f579SHong Zhang 4367d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4368c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43694222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43707906f579SHong Zhang 43718c778c55SBarry Smith /*@C 437211a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43738c778c55SBarry Smith 43748c778c55SBarry Smith Not Collective 43758c778c55SBarry Smith 43768c778c55SBarry Smith Input Parameter: 4377fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43788c778c55SBarry Smith 43798c778c55SBarry Smith Output Parameter: 43808c778c55SBarry Smith . 
array - pointer to the data 43818c778c55SBarry Smith 43828c778c55SBarry Smith Level: intermediate 43838c778c55SBarry Smith 4384fe59aa6dSJacob Faibussowitsch Fortran Notes: 43850ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 43860ab4885dSBarry Smith 43871cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43888c778c55SBarry Smith @*/ 4389d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4390d71ae5a4SJacob Faibussowitsch { 4391d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43928c778c55SBarry Smith 43938c778c55SBarry Smith PetscFunctionBegin; 4394d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43959566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4396d67d9f35SJunchao Zhang } else { 4397d67d9f35SJunchao Zhang *array = aij->a; 4398d67d9f35SJunchao Zhang } 43993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4400d67d9f35SJunchao Zhang } 4401d67d9f35SJunchao Zhang 4402d67d9f35SJunchao Zhang /*@C 440311a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4404d67d9f35SJunchao Zhang 4405d67d9f35SJunchao Zhang Not Collective 4406d67d9f35SJunchao Zhang 4407d67d9f35SJunchao Zhang Input Parameters: 4408fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4409d67d9f35SJunchao Zhang - array - pointer to the data 4410d67d9f35SJunchao Zhang 4411d67d9f35SJunchao Zhang Level: intermediate 4412d67d9f35SJunchao Zhang 4413fe59aa6dSJacob Faibussowitsch Fortran Notes: 44140ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44150ab4885dSBarry Smith 44161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4417d67d9f35SJunchao Zhang 
@*/ 4418d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4419d71ae5a4SJacob Faibussowitsch { 4420d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4421d67d9f35SJunchao Zhang 4422d67d9f35SJunchao Zhang PetscFunctionBegin; 4423d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44249566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4425d67d9f35SJunchao Zhang } else { 4426d67d9f35SJunchao Zhang *array = NULL; 4427d67d9f35SJunchao Zhang } 44289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44299566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44318c778c55SBarry Smith } 44328c778c55SBarry Smith 443321e72a00SBarry Smith /*@C 443411a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44358f1ea47aSStefano Zampini 44360ab4885dSBarry Smith Not Collective; No Fortran Support 44378f1ea47aSStefano Zampini 44388f1ea47aSStefano Zampini Input Parameter: 4439fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44408f1ea47aSStefano Zampini 44418f1ea47aSStefano Zampini Output Parameter: 44428f1ea47aSStefano Zampini . 
array - pointer to the data 44438f1ea47aSStefano Zampini 44448f1ea47aSStefano Zampini Level: intermediate 44458f1ea47aSStefano Zampini 44461cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44478f1ea47aSStefano Zampini @*/ 4448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4449d71ae5a4SJacob Faibussowitsch { 4450d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44518f1ea47aSStefano Zampini 44528f1ea47aSStefano Zampini PetscFunctionBegin; 4453d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44549566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4455d67d9f35SJunchao Zhang } else { 4456d67d9f35SJunchao Zhang *array = aij->a; 4457d67d9f35SJunchao Zhang } 44583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44598f1ea47aSStefano Zampini } 44608f1ea47aSStefano Zampini 44618f1ea47aSStefano Zampini /*@C 446211a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44638f1ea47aSStefano Zampini 44640ab4885dSBarry Smith Not Collective; No Fortran Support 44658f1ea47aSStefano Zampini 44668f1ea47aSStefano Zampini Input Parameter: 4467fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44688f1ea47aSStefano Zampini 44698f1ea47aSStefano Zampini Output Parameter: 44708f1ea47aSStefano Zampini . 
array - pointer to the data 44718f1ea47aSStefano Zampini 44728f1ea47aSStefano Zampini Level: intermediate 44738f1ea47aSStefano Zampini 44741cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44758f1ea47aSStefano Zampini @*/ 4476d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4477d71ae5a4SJacob Faibussowitsch { 4478d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44798f1ea47aSStefano Zampini 44808f1ea47aSStefano Zampini PetscFunctionBegin; 4481d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44829566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4483d67d9f35SJunchao Zhang } else { 4484d67d9f35SJunchao Zhang *array = NULL; 4485d67d9f35SJunchao Zhang } 44863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4487d67d9f35SJunchao Zhang } 4488d67d9f35SJunchao Zhang 4489d67d9f35SJunchao Zhang /*@C 449011a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4491d67d9f35SJunchao Zhang 44920ab4885dSBarry Smith Not Collective; No Fortran Support 4493d67d9f35SJunchao Zhang 4494d67d9f35SJunchao Zhang Input Parameter: 4495fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4496d67d9f35SJunchao Zhang 4497d67d9f35SJunchao Zhang Output Parameter: 4498d67d9f35SJunchao Zhang . 
array - pointer to the data 4499d67d9f35SJunchao Zhang 4500d67d9f35SJunchao Zhang Level: intermediate 4501d67d9f35SJunchao Zhang 45021cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4503d67d9f35SJunchao Zhang @*/ 4504d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4505d71ae5a4SJacob Faibussowitsch { 4506d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4507d67d9f35SJunchao Zhang 4508d67d9f35SJunchao Zhang PetscFunctionBegin; 4509d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45109566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4511d67d9f35SJunchao Zhang } else { 4512d67d9f35SJunchao Zhang *array = aij->a; 4513d67d9f35SJunchao Zhang } 45149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45159566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4517d67d9f35SJunchao Zhang } 4518d67d9f35SJunchao Zhang 4519d67d9f35SJunchao Zhang /*@C 4520d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4521d67d9f35SJunchao Zhang 45220ab4885dSBarry Smith Not Collective; No Fortran Support 4523d67d9f35SJunchao Zhang 4524d67d9f35SJunchao Zhang Input Parameter: 4525fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4526d67d9f35SJunchao Zhang 4527d67d9f35SJunchao Zhang Output Parameter: 4528d67d9f35SJunchao Zhang . 
array - pointer to the data 4529d67d9f35SJunchao Zhang 4530d67d9f35SJunchao Zhang Level: intermediate 4531d67d9f35SJunchao Zhang 45321cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4533d67d9f35SJunchao Zhang @*/ 4534d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4535d71ae5a4SJacob Faibussowitsch { 4536d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4537d67d9f35SJunchao Zhang 4538d67d9f35SJunchao Zhang PetscFunctionBegin; 4539d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45409566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4541d67d9f35SJunchao Zhang } else { 4542d67d9f35SJunchao Zhang *array = NULL; 4543d67d9f35SJunchao Zhang } 45443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45458f1ea47aSStefano Zampini } 45468f1ea47aSStefano Zampini 45478f1ea47aSStefano Zampini /*@C 454811a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45497ee59b9bSJunchao Zhang 45500ab4885dSBarry Smith Not Collective; No Fortran Support 45517ee59b9bSJunchao Zhang 45527ee59b9bSJunchao Zhang Input Parameter: 455311a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45547ee59b9bSJunchao Zhang 45557ee59b9bSJunchao Zhang Output Parameters: 45567ee59b9bSJunchao Zhang + i - row map array of the matrix 45577ee59b9bSJunchao Zhang . j - column index array of the matrix 45587ee59b9bSJunchao Zhang . a - data array of the matrix 4559fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45607ee59b9bSJunchao Zhang 4561fe59aa6dSJacob Faibussowitsch Level: developer 45622ef1f0ffSBarry Smith 45637ee59b9bSJunchao Zhang Notes: 45642ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45657ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45667ee59b9bSJunchao Zhang 45677ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45682ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45697ee59b9bSJunchao Zhang 45701cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45717ee59b9bSJunchao Zhang @*/ 4572d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4573d71ae5a4SJacob Faibussowitsch { 45747ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45757ee59b9bSJunchao Zhang 45767ee59b9bSJunchao Zhang PetscFunctionBegin; 45777ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45787ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45797ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45807ee59b9bSJunchao Zhang } else { 45817ee59b9bSJunchao Zhang if (i) *i = aij->i; 45827ee59b9bSJunchao Zhang if (j) *j = aij->j; 45837ee59b9bSJunchao Zhang if (a) *a = aij->a; 45847ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45857ee59b9bSJunchao Zhang } 45863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45877ee59b9bSJunchao Zhang } 45887ee59b9bSJunchao Zhang 45897ee59b9bSJunchao Zhang /*@C 459021e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 459121e72a00SBarry Smith 459221e72a00SBarry Smith Not Collective 459321e72a00SBarry Smith 459421e72a00SBarry Smith Input Parameter: 4595fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 459621e72a00SBarry Smith 459721e72a00SBarry Smith Output Parameter: 459821e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 459921e72a00SBarry Smith 460021e72a00SBarry Smith Level: intermediate 460121e72a00SBarry Smith 46021cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 460321e72a00SBarry Smith @*/ 4604d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4605d71ae5a4SJacob Faibussowitsch { 460621e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 460721e72a00SBarry Smith 460821e72a00SBarry Smith PetscFunctionBegin; 460921e72a00SBarry Smith *nz = aij->rmax; 46103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 461121e72a00SBarry Smith } 461221e72a00SBarry Smith 46132c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data) 46142c4ab24aSJunchao Zhang { 46152c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data; 46162c4ab24aSJunchao Zhang PetscFunctionBegin; 46172c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46182c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46192c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46202c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46212c4ab24aSJunchao Zhang } 46222c4ab24aSJunchao Zhang 4623d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4624d71ae5a4SJacob Faibussowitsch { 4625394ed5ebSJunchao Zhang MPI_Comm comm; 4626394ed5ebSJunchao Zhang PetscInt *i, *j; 4627394ed5ebSJunchao Zhang PetscInt M, N, row; 4628394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4629394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4630394ed5ebSJunchao Zhang PetscInt *Aj; 4631394ed5ebSJunchao Zhang PetscScalar *Aa; 4632cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4633cbc6b225SStefano Zampini MatType 
rtype; 4634394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46352c4ab24aSJunchao Zhang PetscContainer container; 46362c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4637394ed5ebSJunchao Zhang 4638394ed5ebSJunchao Zhang PetscFunctionBegin; 46399566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46409566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4641e8729f6fSJunchao Zhang i = coo_i; 4642e8729f6fSJunchao Zhang j = coo_j; 46439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4644394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */ 4645394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4646394ed5ebSJunchao Zhang perm[k] = k; 4647394ed5ebSJunchao Zhang } 4648394ed5ebSJunchao Zhang 4649394ed5ebSJunchao Zhang /* Sort by row */ 46509566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4651651b1cf9SStefano Zampini 4652651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4653651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46549371c9d4SSatish Balay if (i[k] >= 0) break; 4655394ed5ebSJunchao Zhang nneg = k; 46569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4657394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 465835cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4659394ed5ebSJunchao Zhang 46609566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4662394ed5ebSJunchao Zhang 4663651b1cf9SStefano Zampini /* Support for HYPRE */ 4664651b1cf9SStefano Zampini PetscBool hypre; 4665651b1cf9SStefano Zampini const char *name; 4666651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4667651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4668651b1cf9SStefano Zampini 4669394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 467035cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4671394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4672394ed5ebSJunchao Zhang while (k < coo_n) { 4673394ed5ebSJunchao Zhang row = i[k]; 4674394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4675394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4676394ed5ebSJunchao Zhang end = k; 4677651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4678651b1cf9SStefano Zampini if (hypre) { 4679651b1cf9SStefano Zampini PetscInt minj = PETSC_MAX_INT; 4680651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 4681651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4682651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4683651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4684651b1cf9SStefano Zampini } 4685651b1cf9SStefano Zampini if (hasdiag) { 4686651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4687651b1cf9SStefano 
Zampini if (j[p] == minj) j[p] = row; 4688651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4689651b1cf9SStefano Zampini } 4690651b1cf9SStefano Zampini } 4691651b1cf9SStefano Zampini } 46929566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4693651b1cf9SStefano Zampini 4694394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4695394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4696651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4697394ed5ebSJunchao Zhang Ai[row] = 1; 4698394ed5ebSJunchao Zhang nnz++; 4699394ed5ebSJunchao Zhang 4700394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4701394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4702394ed5ebSJunchao Zhang q++; 4703394ed5ebSJunchao Zhang jmap[q] = 1; 4704394ed5ebSJunchao Zhang Aj[q] = j[p]; 4705394ed5ebSJunchao Zhang Ai[row]++; 4706394ed5ebSJunchao Zhang nnz++; 4707394ed5ebSJunchao Zhang } else { 4708394ed5ebSJunchao Zhang jmap[q]++; 4709394ed5ebSJunchao Zhang } 4710394ed5ebSJunchao Zhang } 4711394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4712394ed5ebSJunchao Zhang } 4713394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4714394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4715394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4716394ed5ebSJunchao Zhang jmap[0] = 0; 4717394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4718394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4719394ed5ebSJunchao Zhang PetscCount *jmap_new; 4720394ed5ebSJunchao Zhang PetscInt *Aj_new; 4721394ed5ebSJunchao Zhang 47229566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47239566063dSJacob Faibussowitsch 
PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47249566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4725394ed5ebSJunchao Zhang jmap = jmap_new; 4726394ed5ebSJunchao Zhang 47279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 47289566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47299566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4730394ed5ebSJunchao Zhang Aj = Aj_new; 4731394ed5ebSJunchao Zhang } 4732394ed5ebSJunchao Zhang 4733394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4734394ed5ebSJunchao Zhang PetscCount *perm_new; 4735cbc6b225SStefano Zampini 47369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 47379566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47389566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4739394ed5ebSJunchao Zhang perm = perm_new; 4740394ed5ebSJunchao Zhang } 4741394ed5ebSJunchao Zhang 47429566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47439566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 47449566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4745394ed5ebSJunchao Zhang 4746394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4747394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 47482c4ab24aSJunchao Zhang 47492c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 47502c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 47512c4ab24aSJunchao Zhang coo->nz = nnz; 47522c4ab24aSJunchao Zhang coo->n = coo_n; 47532c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 
47542c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 47552c4ab24aSJunchao Zhang coo->perm = perm; 47562c4ab24aSJunchao Zhang PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container)); 47572c4ab24aSJunchao Zhang PetscCall(PetscContainerSetPointer(container, coo)); 47582c4ab24aSJunchao Zhang PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ)); 47592c4ab24aSJunchao Zhang PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container)); 47602c4ab24aSJunchao Zhang PetscCall(PetscContainerDestroy(&container)); 47613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4762394ed5ebSJunchao Zhang } 4763394ed5ebSJunchao Zhang 4764d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4765d71ae5a4SJacob Faibussowitsch { 4766394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4767394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 47682c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4769394ed5ebSJunchao Zhang PetscScalar *Aa; 47702c4ab24aSJunchao Zhang PetscContainer container; 47712c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4772394ed5ebSJunchao Zhang 4773394ed5ebSJunchao Zhang PetscFunctionBegin; 47742c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 47752c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 47762c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 47772c4ab24aSJunchao Zhang perm = coo->perm; 47782c4ab24aSJunchao Zhang jmap = coo->jmap; 47799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4780394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4781b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4782b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4783b6c38306SJunchao 
Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4784394ed5ebSJunchao Zhang } 47859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 47863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4787394ed5ebSJunchao Zhang } 4788394ed5ebSJunchao Zhang 478934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47905063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 479102fe1965SBarry Smith #endif 4792d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4793d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4794d5e393b6SSuyash Tandon #endif 47953d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47965063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47973d0639e7SStefano Zampini #endif 479802fe1965SBarry Smith 4799d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4800d71ae5a4SJacob Faibussowitsch { 4801273d9f13SBarry Smith Mat_SeqAIJ *b; 480238baddfdSBarry Smith PetscMPIInt size; 4803273d9f13SBarry Smith 4804273d9f13SBarry Smith PetscFunctionBegin; 48059566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 480608401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4807273d9f13SBarry Smith 48084dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48092205254eSKarl Rupp 4810b0a32e0cSBarry Smith B->data = (void *)b; 4811aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4812071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48132205254eSKarl Rupp 4814f4259b30SLisandro Dalcin b->row = NULL; 4815f4259b30SLisandro Dalcin b->col = NULL; 4816f4259b30SLisandro Dalcin b->icol = NULL; 4817b810aeb4SBarry Smith b->reallocs = 0; 481836db0b34SBarry Smith 
b->ignorezeroentries = PETSC_FALSE; 4819f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4820416022c9SBarry Smith b->nonew = 0; 4821f4259b30SLisandro Dalcin b->diag = NULL; 4822f4259b30SLisandro Dalcin b->solve_work = NULL; 4823f4259b30SLisandro Dalcin B->spptr = NULL; 4824f4259b30SLisandro Dalcin b->saved_values = NULL; 4825f4259b30SLisandro Dalcin b->idiag = NULL; 4826f4259b30SLisandro Dalcin b->mdiag = NULL; 4827f4259b30SLisandro Dalcin b->ssor_work = NULL; 482871f1c65dSBarry Smith b->omega = 1.0; 482971f1c65dSBarry Smith b->fshift = 0.0; 483071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4831bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4832a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 483317ab2063SBarry Smith 48349566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4835d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 48379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4838b3866ffcSBarry Smith #endif 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 48409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 48419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 48429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 48439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 48449566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 48459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 48469779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4848191b95cbSRichard Tran Mills #endif 484934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 485302fe1965SBarry Smith #endif 4854d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4855d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4856d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4857d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4858d5e393b6SSuyash Tandon #endif 48593d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 48613d0639e7SStefano Zampini #endif 48629566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4863af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4865af8000cdSHong Zhang #endif 4866d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4868d24d4204SJose E. Roman #endif 486963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 487263c07aadSStefano Zampini #endif 48739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 48779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 48789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", 
MatResetPreallocation_SeqAIJ)); 48809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48889566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48899566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 48909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 489217ab2063SBarry Smith } 489317ab2063SBarry Smith 4894b24902e0SBarry Smith /* 48953893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4896b24902e0SBarry Smith */ 4897d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, 
PetscBool mallocmatspace) 4898d71ae5a4SJacob Faibussowitsch { 48992a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4900071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 490117ab2063SBarry Smith 49023a40ed3dSBarry Smith PetscFunctionBegin; 4903aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4904273d9f13SBarry Smith 4905d5f3da31SBarry Smith C->factortype = A->factortype; 4906f4259b30SLisandro Dalcin c->row = NULL; 4907f4259b30SLisandro Dalcin c->col = NULL; 4908f4259b30SLisandro Dalcin c->icol = NULL; 49096ad4291fSHong Zhang c->reallocs = 0; 491017ab2063SBarry Smith 491169272f91SPierre Jolivet C->assembled = A->assembled; 491217ab2063SBarry Smith 491369272f91SPierre Jolivet if (A->preallocated) { 49149566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49159566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4916eec197d1SBarry Smith 491731fe6a7dSBarry Smith if (!A->hash_active) { 49189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49199566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49219566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 492217ab2063SBarry Smith 492317ab2063SBarry Smith /* allocate the matrix space */ 4924f77e22a1SHong Zhang if (mallocmatspace) { 49259566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 49262205254eSKarl Rupp 4927f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 49282205254eSKarl Rupp 49299566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 493017ab2063SBarry Smith if (m > 0) { 49319566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4932be6bf707SBarry 
Smith if (cpvalues == MAT_COPY_VALUES) { 49332e5835c6SStefano Zampini const PetscScalar *aa; 49342e5835c6SStefano Zampini 49359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49369566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 49379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4938be6bf707SBarry Smith } else { 49399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 494017ab2063SBarry Smith } 494108480c60SBarry Smith } 4942f77e22a1SHong Zhang } 494331fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 494431fe6a7dSBarry Smith } else { 494531fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 494631fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 494731fe6a7dSBarry Smith } 494817ab2063SBarry Smith 49496ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4950416022c9SBarry Smith c->roworiented = a->roworiented; 4951416022c9SBarry Smith c->nonew = a->nonew; 4952416022c9SBarry Smith if (a->diag) { 49539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 49549566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4955071fcb05SBarry Smith } else c->diag = NULL; 49562205254eSKarl Rupp 4957f4259b30SLisandro Dalcin c->solve_work = NULL; 4958f4259b30SLisandro Dalcin c->saved_values = NULL; 4959f4259b30SLisandro Dalcin c->idiag = NULL; 4960f4259b30SLisandro Dalcin c->ssor_work = NULL; 4961a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4962e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4963e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49646ad4291fSHong Zhang 4965893ad86cSHong Zhang c->rmax = a->rmax; 4966416022c9SBarry Smith c->nz = a->nz; 49678ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4968754ec7b1SSatish Balay 49696ad4291fSHong Zhang 
c->compressedrow.use = a->compressedrow.use; 49706ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4971cd6b891eSBarry Smith if (a->compressedrow.use) { 49726ad4291fSHong Zhang i = a->compressedrow.nrows; 49739566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49759566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 497627ea64f8SHong Zhang } else { 497727ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49780298fd71SBarry Smith c->compressedrow.i = NULL; 49790298fd71SBarry Smith c->compressedrow.rindex = NULL; 49806ad4291fSHong Zhang } 4981ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4982e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49834846f1f5SKris Buschelman 49849566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 498569272f91SPierre Jolivet } 49869566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 498817ab2063SBarry Smith } 498917ab2063SBarry Smith 4990d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4991d71ae5a4SJacob Faibussowitsch { 4992b24902e0SBarry Smith PetscFunctionBegin; 49939566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49949566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 499548a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49969566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49979566063dSJacob Faibussowitsch 
PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 49983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4999b24902e0SBarry Smith } 5000b24902e0SBarry Smith 5001d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5002d71ae5a4SJacob Faibussowitsch { 500352f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 500452f91c60SVaclav Hapla 500552f91c60SVaclav Hapla PetscFunctionBegin; 500652f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 500752f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5008c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50099566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50109566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50119566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 501252f91c60SVaclav Hapla if (isbinary) { 50139566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 501452f91c60SVaclav Hapla } else if (ishdf5) { 501552f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50169566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 501752f91c60SVaclav Hapla #else 501852f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 501952f91c60SVaclav Hapla #endif 502052f91c60SVaclav Hapla } else { 502198921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 502252f91c60SVaclav Hapla } 50233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 502452f91c60SVaclav Hapla } 502552f91c60SVaclav Hapla 5026d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5027d71ae5a4SJacob Faibussowitsch { 50283ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 50293ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5030fbdbba38SShri Abhyankar 5031fbdbba38SShri Abhyankar PetscFunctionBegin; 50329566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5033bbead8a2SBarry Smith 50343ea6fe3dSLisandro Dalcin /* read in matrix header */ 50359566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 503608401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50379371c9d4SSatish Balay M = header[1]; 50389371c9d4SSatish Balay N = header[2]; 50399371c9d4SSatish Balay nz = header[3]; 504008401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 504108401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 504208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5043fbdbba38SShri Abhyankar 50443ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50459566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 50463ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50473ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50483ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50493ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50503ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50519566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 
50529566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50533ea6fe3dSLisandro Dalcin 50543ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50559566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5056aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50573ea6fe3dSLisandro Dalcin 5058fbdbba38SShri Abhyankar /* read in row lengths */ 50599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 50609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 50613ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50629371c9d4SSatish Balay sum = 0; 50639371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 506408401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50653ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50679566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5068aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50693ea6fe3dSLisandro Dalcin /* store row lengths */ 50709566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50719566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5072fbdbba38SShri Abhyankar 50733ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50749371c9d4SSatish Balay a->i[0] = 0; 50759371c9d4SSatish Balay 
for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50763ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50779566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50783ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50799566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5080fbdbba38SShri Abhyankar 50819566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50829566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 50833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5084fbdbba38SShri Abhyankar } 5085fbdbba38SShri Abhyankar 5086d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5087d71ae5a4SJacob Faibussowitsch { 50887264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5089fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5090eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5091eeffb40dSHong Zhang PetscInt k; 5092eeffb40dSHong Zhang #endif 50937264ac53SSatish Balay 50943a40ed3dSBarry Smith PetscFunctionBegin; 5095bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5096d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5097ca44d042SBarry Smith *flg = PETSC_FALSE; 50983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5099bcd2baecSBarry Smith } 51007264ac53SSatish Balay 51017264ac53SSatish Balay /* if the a->i are the same */ 51029566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51033ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51047264ac53SSatish Balay 51057264ac53SSatish Balay /* if a->j are the same */ 51069566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51073ba16761SJacob Faibussowitsch if (!*flg) 
PetscFunctionReturn(PETSC_SUCCESS); 5108bcd2baecSBarry Smith 51099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5111bcd2baecSBarry Smith /* if a->a are the same */ 5112eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5113eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5114fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5115eeffb40dSHong Zhang *flg = PETSC_FALSE; 51163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5117eeffb40dSHong Zhang } 5118eeffb40dSHong Zhang } 5119eeffb40dSHong Zhang #else 51209566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5121eeffb40dSHong Zhang #endif 51229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 51243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51257264ac53SSatish Balay } 512636db0b34SBarry Smith 512705869f15SSatish Balay /*@ 512811a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 512936db0b34SBarry Smith provided by the user. 513036db0b34SBarry Smith 5131d083f849SBarry Smith Collective 513236db0b34SBarry Smith 513336db0b34SBarry Smith Input Parameters: 513436db0b34SBarry Smith + comm - must be an MPI communicator of size 1 513536db0b34SBarry Smith . m - number of rows 513636db0b34SBarry Smith . n - number of columns 5137483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 513836db0b34SBarry Smith . j - column indices 513936db0b34SBarry Smith - a - matrix values 514036db0b34SBarry Smith 514136db0b34SBarry Smith Output Parameter: 514236db0b34SBarry Smith . 
mat - the matrix 514336db0b34SBarry Smith 514436db0b34SBarry Smith Level: intermediate 514536db0b34SBarry Smith 514636db0b34SBarry Smith Notes: 51472ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5148292fb18eSBarry Smith once the matrix is destroyed and not before 514936db0b34SBarry Smith 515036db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 515136db0b34SBarry Smith 51522ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 515336db0b34SBarry Smith 5154a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5155a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51568eef79e4SBarry Smith as shown 51572ef1f0ffSBarry Smith .vb 51582ef1f0ffSBarry Smith 1 0 0 51592ef1f0ffSBarry Smith 2 0 3 51602ef1f0ffSBarry Smith 4 5 6 5161a4552177SSatish Balay 51622ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 51632ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51642ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 51652ef1f0ffSBarry Smith .ve 5166a4552177SSatish Balay 51671cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 516836db0b34SBarry Smith @*/ 5169d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5170d71ae5a4SJacob Faibussowitsch { 5171cbcfb4deSHong Zhang PetscInt ii; 517236db0b34SBarry Smith Mat_SeqAIJ *aij; 5173cbcfb4deSHong Zhang PetscInt jj; 517436db0b34SBarry Smith 517536db0b34SBarry Smith PetscFunctionBegin; 5176aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51779566063dSJacob Faibussowitsch 
PetscCall(MatCreate(comm, mat)); 51789566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51799566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51809566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5182ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5185ab93d7beSBarry Smith 518636db0b34SBarry Smith aij->i = i; 518736db0b34SBarry Smith aij->j = j; 518836db0b34SBarry Smith aij->a = a; 518936db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 519036db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5191e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5192e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 519336db0b34SBarry Smith 5194cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 519536db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 519676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5197aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51989985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 519908401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 520008401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " 
is identical to previous entry", jj - i[ii], j[jj], ii); 52019985e31cSBarry Smith } 520236db0b34SBarry Smith } 520376bd3646SJed Brown } 520476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 520536db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 520608401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5207aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 520836db0b34SBarry Smith } 520976bd3646SJed Brown } 521036db0b34SBarry Smith 52119566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52129566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 521436db0b34SBarry Smith } 5215cbc6b225SStefano Zampini 5216f62e3866SBarry Smith /*@ 521711a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52188a0b0e6bSVictor Minden provided by the user. 52198a0b0e6bSVictor Minden 5220d083f849SBarry Smith Collective 52218a0b0e6bSVictor Minden 52228a0b0e6bSVictor Minden Input Parameters: 52238a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52248a0b0e6bSVictor Minden . m - number of rows 52258a0b0e6bSVictor Minden . n - number of columns 52268a0b0e6bSVictor Minden . i - row indices 52278a0b0e6bSVictor Minden . j - column indices 52281230e6d1SVictor Minden . a - matrix values 52291230e6d1SVictor Minden . nz - number of nonzeros 52302ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 52318a0b0e6bSVictor Minden 52328a0b0e6bSVictor Minden Output Parameter: 52338a0b0e6bSVictor Minden . 
mat - the matrix 52348a0b0e6bSVictor Minden 52358a0b0e6bSVictor Minden Level: intermediate 52368a0b0e6bSVictor Minden 5237f62e3866SBarry Smith Example: 5238f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52399e99939fSJunchao Zhang .vb 52408a0b0e6bSVictor Minden 1 0 0 52418a0b0e6bSVictor Minden 2 0 3 52428a0b0e6bSVictor Minden 4 5 6 52438a0b0e6bSVictor Minden 52448a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52458a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52468a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52479e99939fSJunchao Zhang .ve 5248fe59aa6dSJacob Faibussowitsch 52492ef1f0ffSBarry Smith Note: 5250d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5251d7547e51SJunchao Zhang and are particularly useful in iterative applications. 52528a0b0e6bSVictor Minden 52531cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 52548a0b0e6bSVictor Minden @*/ 5255d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5256d71ae5a4SJacob Faibussowitsch { 5257d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 52588a0b0e6bSVictor Minden 52598a0b0e6bSVictor Minden PetscFunctionBegin; 52609566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5261ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 52629566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52639566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52649566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52659566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 52661230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52671230e6d1SVictor Minden if (idx) { 52681230e6d1SVictor Minden row = i[ii] - 1; 52691230e6d1SVictor Minden col = j[ii] - 1; 52701230e6d1SVictor Minden } else { 52711230e6d1SVictor Minden row = i[ii]; 52721230e6d1SVictor Minden col = j[ii]; 52738a0b0e6bSVictor Minden } 52749566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52758a0b0e6bSVictor Minden } 52769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52789566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52808a0b0e6bSVictor Minden } 528136db0b34SBarry Smith 5282d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5283d71ae5a4SJacob Faibussowitsch { 5284acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5285acf2f550SJed Brown 5286acf2f550SJed Brown PetscFunctionBegin; 5287acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5288acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52892205254eSKarl Rupp 52909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 52913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5292acf2f550SJed Brown } 5293acf2f550SJed Brown 5294d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5295d71ae5a4SJacob Faibussowitsch { 52969c8f2541SHong Zhang PetscFunctionBegin; 52979566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52999c8f2541SHong Zhang } 53009c8f2541SHong Zhang 530181824310SBarry Smith /* 530253dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 530353dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 530453dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 530553dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 530653dd7562SDmitry Karpeev */ 5307d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5308d71ae5a4SJacob Faibussowitsch { 530953dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 531053dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 531153dd7562SDmitry Karpeev PetscBool seqaij; 531253dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 531353dd7562SDmitry Karpeev PetscScalar v; 531453dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 531553dd7562SDmitry Karpeev 531653dd7562SDmitry Karpeev PetscFunctionBegin; 53173ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 531853dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53199566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 532028b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 532153dd7562SDmitry Karpeev if (rowemb) { 53229566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 532308401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 532453dd7562SDmitry Karpeev } else { 532508401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 532653dd7562SDmitry Karpeev } 532753dd7562SDmitry Karpeev if (colemb) { 53289566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 532908401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 533053dd7562SDmitry Karpeev } else { 533108401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 533253dd7562SDmitry Karpeev } 533353dd7562SDmitry Karpeev 533453dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 533553dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5337ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 53389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 53399566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 534053dd7562SDmitry Karpeev } 534148a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 534253dd7562SDmitry Karpeev count = 0; 534353dd7562SDmitry Karpeev rowindices = NULL; 
534453dd7562SDmitry Karpeev colindices = NULL; 534548a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 534648a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 534753dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 534853dd7562SDmitry Karpeev PetscInt row; 534953dd7562SDmitry Karpeev row = i; 535053dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 535153dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 535253dd7562SDmitry Karpeev PetscInt col; 535353dd7562SDmitry Karpeev col = Baij->j[count]; 535453dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 535553dd7562SDmitry Karpeev v = Baij->a[count]; 53569566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 535753dd7562SDmitry Karpeev ++count; 535853dd7562SDmitry Karpeev } 535953dd7562SDmitry Karpeev } 536053dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 536153dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 536253dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 536353dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 536453dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 53653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 536653dd7562SDmitry Karpeev } 536753dd7562SDmitry Karpeev 536858c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5369dec0b466SHong Zhang { 5370dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5371dec0b466SHong Zhang MatScalar *aa = a->a; 5372dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5373dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5374dec0b466SHong Zhang 5375dec0b466SHong Zhang PetscFunctionBegin; 5376dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5377dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5378dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5379dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5380dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 538158c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5382dec0b466SHong Zhang else { 5383dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5384dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5385dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5386dec0b466SHong Zhang } 5387dec0b466SHong Zhang } 5388dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5389dec0b466SHong Zhang fshift_prev = fshift; 5390dec0b466SHong Zhang /* reset ilen and imax for each row */ 5391dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5392dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5393dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5394dec0b466SHong Zhang } 5395312eded4SPierre Jolivet if (fshift) { 5396dec0b466SHong Zhang if (m) { 5397dec0b466SHong Zhang ai[m] -= fshift; 5398dec0b466SHong Zhang a->nz = ai[m]; 5399dec0b466SHong Zhang } 5400dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5401312eded4SPierre Jolivet A->nonzerostate++; 5402dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5403dec0b466SHong Zhang a->rmax = rmax; 5404dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5405dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5406dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5407312eded4SPierre Jolivet } 54083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5409dec0b466SHong Zhang } 5410dec0b466SHong Zhang 54114099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54124099cc6bSBarry Smith 54134099cc6bSBarry Smith /*@C 541411a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54154099cc6bSBarry Smith 5416c3339decSBarry Smith Collective 54174099cc6bSBarry Smith 54184099cc6bSBarry Smith Input Parameters: 54194099cc6bSBarry Smith + mat - the matrix object 54204099cc6bSBarry Smith - matype - matrix type 54214099cc6bSBarry Smith 54224099cc6bSBarry Smith Options Database Key: 54234e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54244099cc6bSBarry Smith 54254099cc6bSBarry Smith Level: intermediate 54264099cc6bSBarry Smith 5427fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 54284099cc6bSBarry Smith @*/ 5429d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5430d71ae5a4SJacob Faibussowitsch { 54314099cc6bSBarry Smith PetscBool sametype; 54325f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 54334099cc6bSBarry Smith 54344099cc6bSBarry Smith PetscFunctionBegin; 54354099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 54369566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 54373ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 54384099cc6bSBarry Smith 54399566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 54406adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 54419566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 54423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54434099cc6bSBarry Smith } 54444099cc6bSBarry Smith 54454099cc6bSBarry Smith /*@C 544611a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 54474099cc6bSBarry Smith 54484099cc6bSBarry Smith Not Collective 54494099cc6bSBarry Smith 54504099cc6bSBarry Smith Input Parameters: 5451fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 54524099cc6bSBarry Smith - function - routine to convert to subtype 54534099cc6bSBarry Smith 54542ef1f0ffSBarry Smith Level: advanced 54552ef1f0ffSBarry Smith 54564099cc6bSBarry Smith Notes: 545711a5261eSBarry Smith `MatSeqAIJRegister()` may be 
called multiple times to add several user-defined solvers. 54584099cc6bSBarry Smith 54594099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54604099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54614099cc6bSBarry Smith 54621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 54634099cc6bSBarry Smith @*/ 5464d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5465d71ae5a4SJacob Faibussowitsch { 54664099cc6bSBarry Smith PetscFunctionBegin; 54679566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54689566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 54693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54704099cc6bSBarry Smith } 54714099cc6bSBarry Smith 54724099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54734099cc6bSBarry Smith 54744099cc6bSBarry Smith /*@C 547511a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 54764099cc6bSBarry Smith 54774099cc6bSBarry Smith Not Collective 54784099cc6bSBarry Smith 54794099cc6bSBarry Smith Level: advanced 54804099cc6bSBarry Smith 54812ef1f0ffSBarry Smith Note: 54822ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 54832ef1f0ffSBarry Smith 54841cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 54854099cc6bSBarry Smith @*/ 5486d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5487d71ae5a4SJacob Faibussowitsch { 54884099cc6bSBarry Smith PetscFunctionBegin; 54893ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 54904099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54914099cc6bSBarry Smith 54929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, 
MatConvert_SeqAIJ_SeqAIJCRL)); 54939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54959779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5497485f9817SRichard Tran Mills #endif 54985063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55005063d097SStefano Zampini #endif 5501d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5502d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5503d5e393b6SSuyash Tandon #endif 55045063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55065063d097SStefano Zampini #endif 55074099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55094099cc6bSBarry Smith #endif 55103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55114099cc6bSBarry Smith } 551253dd7562SDmitry Karpeev 551353dd7562SDmitry Karpeev /* 551481824310SBarry Smith Special version for direct calls from Fortran 551581824310SBarry Smith */ 5516af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 551781824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 551881824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 551981824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 552081824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 552181824310SBarry Smith #endif 552281824310SBarry Smith 
552381824310SBarry Smith /* Change these macros so can be used in void function */ 552498921bdaSJacob Faibussowitsch 552598921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 55269566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 55279566063dSJacob Faibussowitsch #undef PetscCall 55289371c9d4SSatish Balay #define PetscCall(...) \ 55299371c9d4SSatish Balay do { \ 55305f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 553198921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 553298921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 553398921bdaSJacob Faibussowitsch return; \ 553498921bdaSJacob Faibussowitsch } \ 553598921bdaSJacob Faibussowitsch } while (0) 553698921bdaSJacob Faibussowitsch 553798921bdaSJacob Faibussowitsch #undef SETERRQ 55389371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) 
\ 55399371c9d4SSatish Balay do { \ 554098921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 554198921bdaSJacob Faibussowitsch return; \ 554298921bdaSJacob Faibussowitsch } while (0) 554381824310SBarry Smith 5544d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5545d71ae5a4SJacob Faibussowitsch { 554681824310SBarry Smith Mat A = *AA; 554781824310SBarry Smith PetscInt m = *mm, n = *nn; 554881824310SBarry Smith InsertMode is = *isis; 554981824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 555081824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 555181824310SBarry Smith PetscInt *imax, *ai, *ailen; 555281824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 555354f21887SBarry Smith MatScalar *ap, value, *aa; 5554ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5555ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 555681824310SBarry Smith 555781824310SBarry Smith PetscFunctionBegin; 55584994cf47SJed Brown MatCheckPreallocated(A, 1); 555981824310SBarry Smith imax = a->imax; 556081824310SBarry Smith ai = a->i; 556181824310SBarry Smith ailen = a->ilen; 556281824310SBarry Smith aj = a->j; 556381824310SBarry Smith aa = a->a; 556481824310SBarry Smith 556581824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 556681824310SBarry Smith row = im[k]; 556781824310SBarry Smith if (row < 0) continue; 55685f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 55699371c9d4SSatish Balay rp = aj + ai[row]; 55709371c9d4SSatish Balay ap = aa + ai[row]; 55719371c9d4SSatish Balay rmax = imax[row]; 55729371c9d4SSatish Balay nrow = ailen[row]; 557381824310SBarry 
Smith low = 0; 557481824310SBarry Smith high = nrow; 557581824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 557681824310SBarry Smith if (in[l] < 0) continue; 55775f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 557881824310SBarry Smith col = in[l]; 55792205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 55802205254eSKarl Rupp else value = v[k + l * m]; 55812205254eSKarl Rupp 558281824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 558381824310SBarry Smith 55842205254eSKarl Rupp if (col <= lastcol) low = 0; 55852205254eSKarl Rupp else high = nrow; 558681824310SBarry Smith lastcol = col; 558781824310SBarry Smith while (high - low > 5) { 558881824310SBarry Smith t = (low + high) / 2; 558981824310SBarry Smith if (rp[t] > col) high = t; 559081824310SBarry Smith else low = t; 559181824310SBarry Smith } 559281824310SBarry Smith for (i = low; i < high; i++) { 559381824310SBarry Smith if (rp[i] > col) break; 559481824310SBarry Smith if (rp[i] == col) { 559581824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 559681824310SBarry Smith else ap[i] = value; 559781824310SBarry Smith goto noinsert; 559881824310SBarry Smith } 559981824310SBarry Smith } 560081824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 560181824310SBarry Smith if (nonew == 1) goto noinsert; 56025f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5603fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56049371c9d4SSatish Balay N = nrow++ - 1; 56059371c9d4SSatish Balay a->nz++; 56069371c9d4SSatish Balay high++; 560781824310SBarry Smith /* shift up all the later entries in this row */ 560881824310SBarry Smith for (ii = N; ii >= i; ii--) { 
560981824310SBarry Smith rp[ii + 1] = rp[ii]; 561081824310SBarry Smith ap[ii + 1] = ap[ii]; 561181824310SBarry Smith } 561281824310SBarry Smith rp[i] = col; 561381824310SBarry Smith ap[i] = value; 5614e56f5c9eSBarry Smith A->nonzerostate++; 561581824310SBarry Smith noinsert:; 561681824310SBarry Smith low = i + 1; 561781824310SBarry Smith } 561881824310SBarry Smith ailen[row] = nrow; 561981824310SBarry Smith } 562081824310SBarry Smith PetscFunctionReturnVoid(); 562181824310SBarry Smith } 562298921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 562398921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 562498921bdaSJacob Faibussowitsch * original definitions */ 56259566063dSJacob Faibussowitsch #undef PetscCall 562698921bdaSJacob Faibussowitsch #undef SETERRQ 5627