1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang 
MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 4979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 5009566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5394dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 5479f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i)); 5489f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j)); 
5499f0612e4SBarry Smith a->free_ij = PETSC_TRUE; 55019b08ed1SBarry Smith if (A->structure_only) { 55119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55219b08ed1SBarry Smith } else { 5539f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a)); 55419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55519b08ed1SBarry Smith } 5569f0612e4SBarry Smith a->i[0] = 0; 55719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith 562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 563d71ae5a4SJacob Faibussowitsch { 564071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 565071fcb05SBarry Smith PetscInt *rp, k, row; 566071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567071fcb05SBarry Smith PetscInt *aj = a->j; 568fff043a9SJunchao Zhang MatScalar *aa, *ap; 569071fcb05SBarry Smith 570071fcb05SBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 572071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 573071fcb05SBarry Smith row = im[k]; 5746bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 575071fcb05SBarry Smith rp = aj + ai[row]; 576071fcb05SBarry Smith ap = aa + ai[row]; 57748a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 578071fcb05SBarry Smith if (!A->structure_only) { 579071fcb05SBarry Smith if (v) { 5809566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 581071fcb05SBarry Smith v += n; 
582071fcb05SBarry Smith } else { 5839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 584071fcb05SBarry Smith } 585071fcb05SBarry Smith } 586071fcb05SBarry Smith ailen[row] = n; 587071fcb05SBarry Smith a->nz += n; 588071fcb05SBarry Smith } 5899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith 593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 594d71ae5a4SJacob Faibussowitsch { 5957eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59697f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59797f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5984e208921SJed Brown const MatScalar *ap, *aa; 5997eb43aa7SLois Curfman McInnes 6003a40ed3dSBarry Smith PetscFunctionBegin; 6014e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6027eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6037eb43aa7SLois Curfman McInnes row = im[k]; 6049371c9d4SSatish Balay if (row < 0) { 6059371c9d4SSatish Balay v += n; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative row */ 60854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6098e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6108e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6117eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6127eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6139371c9d4SSatish Balay if (in[l] < 0) { 6149371c9d4SSatish Balay v++; 6159371c9d4SSatish Balay continue; 6169371c9d4SSatish Balay } /* negative column */ 
61754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 618bfeeae90SHong Zhang col = in[l]; 6199371c9d4SSatish Balay high = nrow; 6209371c9d4SSatish Balay low = 0; /* assume unsorted */ 6217eb43aa7SLois Curfman McInnes while (high - low > 5) { 6227eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6237eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6247eb43aa7SLois Curfman McInnes else low = t; 6257eb43aa7SLois Curfman McInnes } 6267eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6277eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6287eb43aa7SLois Curfman McInnes if (rp[i] == col) { 629b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6307eb43aa7SLois Curfman McInnes goto finished; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes } 63397e567efSBarry Smith *v++ = 0.0; 6347eb43aa7SLois Curfman McInnes finished:; 6357eb43aa7SLois Curfman McInnes } 6367eb43aa7SLois Curfman McInnes } 6374e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6397eb43aa7SLois Curfman McInnes } 6407eb43aa7SLois Curfman McInnes 641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 642d71ae5a4SJacob Faibussowitsch { 6433ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 644c898d852SStefano Zampini const PetscScalar *av; 6453ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6463ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64717ab2063SBarry Smith 6483a40ed3dSBarry Smith PetscFunctionBegin; 6499566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6502205254eSKarl Rupp 6513ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6523ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6533ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6543ea6fe3dSLisandro Dalcin nz = A->nz; 655416022c9SBarry 
Smith 6563ea6fe3dSLisandro Dalcin /* write matrix header */ 6573ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6589371c9d4SSatish Balay header[1] = M; 6599371c9d4SSatish Balay header[2] = N; 6609371c9d4SSatish Balay header[3] = nz; 6619566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6653ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6669566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6679566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6683ea6fe3dSLisandro Dalcin /* store column indices */ 6699566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 670416022c9SBarry Smith /* store nonzero values */ 6719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 674b37d52dbSMark F. 
Adams 6753ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6769566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 67817ab2063SBarry Smith } 679416022c9SBarry Smith 680d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 681d71ae5a4SJacob Faibussowitsch { 6827dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6837dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6847dc0baabSHong Zhang 6857dc0baabSHong Zhang PetscFunctionBegin; 6869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6877dc0baabSHong Zhang for (i = 0; i < m; i++) { 6889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68948a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6917dc0baabSHong Zhang } 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6947dc0baabSHong Zhang } 6957dc0baabSHong Zhang 69609573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 697cd155464SBarry Smith 698ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 699d71ae5a4SJacob Faibussowitsch { 700416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 701c898d852SStefano Zampini const PetscScalar *av; 70260e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 703e060cb09SBarry Smith const char *name; 704f3ef73ceSBarry Smith PetscViewerFormat format; 70517ab2063SBarry Smith 7063a40ed3dSBarry Smith PetscFunctionBegin; 7077dc0baabSHong Zhang if (A->structure_only) { 7089566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7107dc0baabSHong Zhang } 71143e49210SHong Zhang 7129566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 713bd6a2ce3SJunchao Zhang // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries 7143ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7152e5835c6SStefano Zampini 716c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71971c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72097f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72160e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 722c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 723d00d2cf4SBarry Smith nofinalvalue = 1; 724d00d2cf4SBarry Smith } 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 728fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #else 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 732fbfe6fa7SJed Brown #endif 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73417ab2063SBarry Smith 73517ab2063SBarry Smith for (i = 0; i < m; i++) { 73660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 737aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73917ab2063SBarry Smith #else 7409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74117ab2063SBarry Smith #endif 74217ab2063SBarry Smith } 74317ab2063SBarry Smith } 744d00d2cf4SBarry Smith if (nofinalvalue) { 745c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 747c337ccceSJed Brown #else 7489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 749c337ccceSJed Brown #endif 750d00d2cf4SBarry Smith } 7519566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 754fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75644cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 759aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76436db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7666831982aSBarry Smith } 76744cd7ae7SLois Curfman McInnes #else 7689566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76944cd7ae7SLois Curfman McInnes #endif 77044cd7ae7SLois Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77244cd7ae7SLois 
Curfman McInnes } 7739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 774fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77597f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 778496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 779496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 781496be53dSLois Curfman McInnes if (a->j[j] >= i) { 782aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 784496be53dSLois Curfman McInnes #else 785496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 786496be53dSLois Curfman McInnes #endif 787496be53dSLois Curfman McInnes } 788496be53dSLois Curfman McInnes } 789496be53dSLois Curfman McInnes } 7902e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7922e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7932205254eSKarl Rupp if (i + 4 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7952205254eSKarl Rupp } else if (i + 3 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7972205254eSKarl Rupp } else if (i + 2 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7992205254eSKarl Rupp } else if (i + 1 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8012205254eSKarl Rupp } else if (i < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8032205254eSKarl Rupp } else { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8052205254eSKarl Rupp } 806496be53dSLois Curfman McInnes } 8079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8089566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 809496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8119566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes } 8159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 816496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 818496be53dSLois Curfman McInnes if (a->j[j] >= i) { 819aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82048a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 821496be53dSLois Curfman McInnes #else 8229566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
823496be53dSLois Curfman McInnes #endif 824496be53dSLois Curfman McInnes } 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 827496be53dSLois Curfman McInnes } 8289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 829fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83097f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83187828ca2SBarry Smith PetscScalar value; 83268f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83368f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83468f1ed48SBarry Smith 83568f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83668f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83768f1ed48SBarry Smith realonly = PETSC_FALSE; 83868f1ed48SBarry Smith break; 83968f1ed48SBarry Smith } 84068f1ed48SBarry Smith } 84168f1ed48SBarry Smith #endif 84202594712SBarry Smith 8439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84402594712SBarry Smith for (i = 0; i < m; i++) { 84502594712SBarry Smith jcnt = 0; 846d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 847e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84802594712SBarry Smith value = a->a[cnt++]; 849e24b481bSBarry Smith jcnt++; 85002594712SBarry Smith } else { 85102594712SBarry Smith value = 0.0; 85202594712SBarry Smith } 853aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85468f1ed48SBarry Smith if (realonly) { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85668f1ed48SBarry Smith } else { 8579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85868f1ed48SBarry Smith } 85902594712SBarry Smith #else 8609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86102594712SBarry Smith 
#endif 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86402594712SBarry Smith } 8659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8663c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 867150b93efSMatthew G. Knepley PetscInt fshift = 1; 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8693c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8713c215bfdSMatthew Knepley #else 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8733c215bfdSMatthew Knepley #endif 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8753c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8773c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8793c215bfdSMatthew Knepley #else 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8813c215bfdSMatthew Knepley #endif 8823c215bfdSMatthew Knepley } 8833c215bfdSMatthew Knepley } 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8853a40ed3dSBarry Smith } else { 8869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 887d5f3da31SBarry Smith if (A->factortype) { 88816cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89016cd7e1dSShri Abhyankar /* L part */ 89160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89716cd7e1dSShri Abhyankar } else { 8989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89916cd7e1dSShri Abhyankar } 90016cd7e1dSShri Abhyankar #else 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90216cd7e1dSShri Abhyankar #endif 90316cd7e1dSShri Abhyankar } 90416cd7e1dSShri Abhyankar /* diagonal */ 90516cd7e1dSShri Abhyankar j = a->diag[i]; 90616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 908835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j]))); 90916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 910835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j])))); 91116cd7e1dSShri Abhyankar } else { 912835f2295SStefano Zampini 
PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j]))); 91316cd7e1dSShri Abhyankar } 91416cd7e1dSShri Abhyankar #else 915835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j]))); 91616cd7e1dSShri Abhyankar #endif 91716cd7e1dSShri Abhyankar 91816cd7e1dSShri Abhyankar /* U part */ 91960e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92516cd7e1dSShri Abhyankar } else { 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92716cd7e1dSShri Abhyankar } 92816cd7e1dSShri Abhyankar #else 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93016cd7e1dSShri Abhyankar #endif 93116cd7e1dSShri Abhyankar } 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93316cd7e1dSShri Abhyankar } 93416cd7e1dSShri Abhyankar } else { 93517ab2063SBarry Smith for (i = 0; i < m; i++) { 9369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 938aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 
9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94136db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9433a40ed3dSBarry Smith } else { 9449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94517ab2063SBarry Smith } 94617ab2063SBarry Smith #else 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94817ab2063SBarry Smith #endif 94917ab2063SBarry Smith } 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95117ab2063SBarry Smith } 95216cd7e1dSShri Abhyankar } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95417ab2063SBarry Smith } 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 957416022c9SBarry Smith } 958416022c9SBarry Smith 9599804daf3SBarry Smith #include <petscdraw.h> 960ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 961d71ae5a4SJacob Faibussowitsch { 962480ef9eaSBarry Smith Mat A = (Mat)Aa; 963416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 964383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 965383922c3SLisandro Dalcin int color; 966b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 967b0a32e0cSBarry Smith PetscViewer viewer; 968f3ef73ceSBarry Smith PetscViewerFormat format; 969fff043a9SJunchao Zhang const PetscScalar *aa; 970cddf8d76SBarry Smith 9713a40ed3dSBarry Smith PetscFunctionBegin; 
9729566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9739566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9749566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 975383922c3SLisandro Dalcin 976416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 978fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 979d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9800513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 981b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 982416022c9SBarry Smith for (i = 0; i < m; i++) { 9839371c9d4SSatish Balay y_l = m - i - 1.0; 9849371c9d4SSatish Balay y_r = y_l + 1.0; 985bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9869371c9d4SSatish Balay x_l = a->j[j]; 9879371c9d4SSatish Balay x_r = x_l + 1.0; 988fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9899566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 990cddf8d76SBarry Smith } 991cddf8d76SBarry Smith } 992b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 993cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9949371c9d4SSatish Balay y_l = m - i - 1.0; 9959371c9d4SSatish Balay y_r = y_l + 1.0; 996bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9979371c9d4SSatish Balay x_l = a->j[j]; 9989371c9d4SSatish Balay x_r = x_l + 1.0; 999fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10009566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1001cddf8d76SBarry Smith } 1002cddf8d76SBarry Smith } 1003b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1004cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10059371c9d4SSatish Balay y_l = m - i - 1.0; 10069371c9d4SSatish Balay y_r = y_l + 1.0; 1007bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10089371c9d4SSatish Balay x_l = a->j[j]; 10099371c9d4SSatish Balay x_r = x_l + 1.0; 1010fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10119566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1012416022c9SBarry Smith } 1013416022c9SBarry Smith } 1014d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10150513a670SBarry Smith } else { 10160513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10170513a670SBarry Smith /* first determine max of all nonzero values */ 1018b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1019383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1020b0a32e0cSBarry Smith PetscDraw popup; 10210513a670SBarry Smith 10220513a670SBarry Smith for (i = 0; i < nz; i++) { 1023fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10240513a670SBarry Smith } 1025383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10269566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10279566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1028383922c3SLisandro Dalcin 1029d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10300513a670SBarry Smith for (i = 0; i < m; i++) { 1031383922c3SLisandro Dalcin y_l = m - i - 1.0; 1032383922c3SLisandro Dalcin y_r = y_l + 1.0; 1033bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1034383922c3SLisandro Dalcin x_l = a->j[j]; 1035383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1036fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10379566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10380513a670SBarry Smith count++; 10390513a670SBarry Smith } 10400513a670SBarry Smith } 1041d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10420513a670SBarry Smith } 10439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1045480ef9eaSBarry Smith } 1046cddf8d76SBarry Smith 10479804daf3SBarry Smith #include <petscdraw.h> 1048ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1049d71ae5a4SJacob Faibussowitsch { 1050b0a32e0cSBarry Smith PetscDraw draw; 105136db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1052ace3abfcSBarry Smith PetscBool isnull; 1053480ef9eaSBarry Smith 1054480ef9eaSBarry Smith PetscFunctionBegin; 10559566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10569566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10573ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1058480ef9eaSBarry Smith 10599371c9d4SSatish Balay xr = A->cmap->n; 10609371c9d4SSatish Balay yr = A->rmap->n; 10619371c9d4SSatish Balay h = yr / 10.0; 10629371c9d4SSatish Balay w = xr / 10.0; 10639371c9d4SSatish Balay xr += w; 10649371c9d4SSatish Balay yr += h; 10659371c9d4SSatish Balay xl = -w; 10669371c9d4SSatish Balay yl = -h; 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10709566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10719566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1073416022c9SBarry Smith } 1074416022c9SBarry Smith 1075d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1076d71ae5a4SJacob Faibussowitsch { 1077ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1078416022c9SBarry Smith 10793a40ed3dSBarry Smith PetscFunctionBegin; 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10819566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10829566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10831baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10841baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10851baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10869566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108817ab2063SBarry Smith } 108919bcc07fSBarry Smith 1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1091d71ae5a4SJacob Faibussowitsch { 1092416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1093580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1094bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 109554f21887SBarry Smith MatScalar *aa = a->a, *ap; 10963447b6efSHong Zhang PetscReal ratio = 0.6; 109717ab2063SBarry Smith 10983a40ed3dSBarry Smith PetscFunctionBegin; 10993ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1101b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1102b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11039566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1105b215bc84SStefano Zampini } 110617ab2063SBarry Smith 110743ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110817ab2063SBarry Smith for (i = 1; i < m; i++) { 1109416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111017ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111194a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111217ab2063SBarry Smith if (fshift) { 1113bfeeae90SHong Zhang ip = aj + ai[i]; 1114bfeeae90SHong Zhang ap = aa + ai[i]; 111517ab2063SBarry Smith N = ailen[i]; 11169566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111748a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111817ab2063SBarry Smith } 111917ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112017ab2063SBarry Smith } 112117ab2063SBarry Smith if (m) { 112217ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112317ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112417ab2063SBarry Smith } 112517ab2063SBarry Smith /* reset ilen and imax for each row */ 11267b083b7cSBarry Smith a->nonzerorowcnt = 0; 1127396832f4SHong Zhang if (A->structure_only) { 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11299566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1130396832f4SHong Zhang } else { /* !A->structure_only */ 113117ab2063SBarry Smith for (i = 0; i < m; i++) { 113217ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11337b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113417ab2063SBarry Smith } 1135396832f4SHong Zhang } 
1136bfeeae90SHong Zhang a->nz = ai[m]; 1137aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1138bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1139bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1140bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1141bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1142bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1143bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1144bc43efbbSJunchao Zhang break; 1145bc43efbbSJunchao Zhang } 1146bc43efbbSJunchao Zhang } 11479566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11499566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11502205254eSKarl Rupp 11518e58a170SBarry Smith A->info.mallocs += a->reallocs; 1152dd5f02e7SSatish Balay a->reallocs = 0; 11536712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115436db0b34SBarry Smith a->rmax = rmax; 11554e220ebcSLois Curfman McInnes 115648a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11579566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115917ab2063SBarry Smith } 116017ab2063SBarry Smith 1161ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1162d71ae5a4SJacob Faibussowitsch 
{ 116399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116499cafbc1SBarry Smith PetscInt i, nz = a->nz; 11652e5835c6SStefano Zampini MatScalar *aa; 116699cafbc1SBarry Smith 116799cafbc1SBarry Smith PetscFunctionBegin; 11689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117399cafbc1SBarry Smith } 117499cafbc1SBarry Smith 1175ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1176d71ae5a4SJacob Faibussowitsch { 117799cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117899cafbc1SBarry Smith PetscInt i, nz = a->nz; 11792e5835c6SStefano Zampini MatScalar *aa; 118099cafbc1SBarry Smith 118199cafbc1SBarry Smith PetscFunctionBegin; 11829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118399cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118799cafbc1SBarry Smith } 118899cafbc1SBarry Smith 1189d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1190d71ae5a4SJacob Faibussowitsch { 1191fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1192fff043a9SJunchao Zhang MatScalar *aa; 11933a40ed3dSBarry Smith 11943a40ed3dSBarry Smith PetscFunctionBegin; 11959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11969566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11989566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120017ab2063SBarry Smith } 1201416022c9SBarry Smith 1202674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A) 1203d71ae5a4SJacob Faibussowitsch { 1204416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1205d5d45c9bSBarry Smith 12063a40ed3dSBarry Smith PetscFunctionBegin; 1207b4e2f619SBarry Smith if (A->hash_active) { 1208e3c72094SPierre Jolivet A->ops[0] = a->cops; 1209b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1210b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1211b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1212b4e2f619SBarry Smith } 1213b4e2f619SBarry Smith 12143ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12159566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12169566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12179566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12259566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12289566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 1229674b392bSAlexander 
PetscFunctionReturn(PETSC_SUCCESS); 1230674b392bSAlexander } 1231674b392bSAlexander 1232674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A) 1233674b392bSAlexander { 1234674b392bSAlexander PetscFunctionBegin; 1235674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 1236674b392bSAlexander PetscCall(MatCreate_SeqAIJ_Inode(A)); 1237674b392bSAlexander PetscCall(MatSetUp_Seq_Hash(A)); 1238674b392bSAlexander A->nonzerostate++; 1239674b392bSAlexander PetscFunctionReturn(PETSC_SUCCESS); 1240674b392bSAlexander } 1241674b392bSAlexander 1242674b392bSAlexander PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1243674b392bSAlexander { 1244674b392bSAlexander PetscFunctionBegin; 1245674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 12469566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1247901853e0SKris Buschelman 12486718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12496718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12506718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. 
We free it here to avoid 12516718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12526718818eSStefano Zampini due to different matrix sizes */ 12539566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12546718818eSStefano Zampini 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12562e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12572e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12642e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12652e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12662e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12672e956fe4SStefano Zampini #endif 12684222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12709566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12724222ddf1SHong Zhang #endif 1273d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1274d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1275d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1276d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1277d5e393b6SSuyash Tandon #endif 12783d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12803d0639e7SStefano Zampini #endif 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1282af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1284af8000cdSHong Zhang #endif 1285d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1287d24d4204SJose E. 
Roman #endif 128863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 129163c07aadSStefano Zampini #endif 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12962e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 1299674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 13029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 13039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 13049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 13059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL)); 13069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 13079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 13082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 13092e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13102e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 13112e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 13122e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13132e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13142e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 131617ab2063SBarry Smith } 131717ab2063SBarry Smith 1318d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1319d71ae5a4SJacob Faibussowitsch { 1320416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13213a40ed3dSBarry Smith 13223a40ed3dSBarry Smith PetscFunctionBegin; 1323a65d3064SKris Buschelman switch (op) { 1324d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1325d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1326d71ae5a4SJacob Faibussowitsch break; 1327d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1328d71ae5a4SJacob Faibussowitsch 
a->keepnonzeropattern = flg; 1329d71ae5a4SJacob Faibussowitsch break; 1330d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1331d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1332d71ae5a4SJacob Faibussowitsch break; 1333d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1334d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1335d71ae5a4SJacob Faibussowitsch break; 1336d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1337d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1338d71ae5a4SJacob Faibussowitsch break; 1339d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1340d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1341d71ae5a4SJacob Faibussowitsch break; 1342d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1343d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1344d71ae5a4SJacob Faibussowitsch break; 13453d472b54SHong Zhang case MAT_SPD: 1346b1646e73SJed Brown case MAT_SYMMETRIC: 1347b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1348b1646e73SJed Brown case MAT_HERMITIAN: 1349b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1350957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1351b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1352b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1353b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13545021d80fSJed Brown break; 13558c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1356a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1357d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1358d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1359d71ae5a4SJacob Faibussowitsch break; 1360d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1361d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1362d71ae5a4SJacob Faibussowitsch break; 1363d71ae5a4SJacob Faibussowitsch case 
MAT_SUBMAT_SINGLEIS: 1364d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1365d71ae5a4SJacob Faibussowitsch break; 1366071fcb05SBarry Smith case MAT_SORTED_FULL: 1367071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1368071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1369071fcb05SBarry Smith break; 1370d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1371d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1372d71ae5a4SJacob Faibussowitsch break; 1373d71ae5a4SJacob Faibussowitsch default: 1374d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1375a65d3064SKris Buschelman } 13763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 137717ab2063SBarry Smith } 137817ab2063SBarry Smith 1379ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1380d71ae5a4SJacob Faibussowitsch { 1381416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1382fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1383c898d852SStefano Zampini PetscScalar *x; 1384c898d852SStefano Zampini const PetscScalar *aa; 138517ab2063SBarry Smith 13863a40ed3dSBarry Smith PetscFunctionBegin; 13879566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 138808401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1390d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1391d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13929566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13932c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13949566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13963ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139735e7444dSHong Zhang } 139835e7444dSHong Zhang 13999566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 140035e7444dSHong Zhang for (i = 0; i < n; i++) { 1401fdc842d1SBarry Smith x[i] = 0.0; 140235e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 140335e7444dSHong Zhang if (aj[j] == i) { 140435e7444dSHong Zhang x[i] = aa[j]; 140517ab2063SBarry Smith break; 140617ab2063SBarry Smith } 140717ab2063SBarry Smith } 140817ab2063SBarry Smith } 14099566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 14109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 141217ab2063SBarry Smith } 141317ab2063SBarry Smith 1414c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1415d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1416d71ae5a4SJacob Faibussowitsch { 1417416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14185f22a7b3SSebastian Grimberg const MatScalar *aa; 1419d9ca1df4SBarry Smith PetscScalar *y; 1420d9ca1df4SBarry Smith const PetscScalar *x; 1421d0f46423SBarry Smith PetscInt m = A->rmap->n; 14225c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14235f22a7b3SSebastian Grimberg const MatScalar *v; 1424a77337e4SBarry Smith PetscScalar alpha; 1425d9ca1df4SBarry Smith PetscInt n, i, j; 1426d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14273447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1428ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14295c897100SBarry Smith #endif 143017ab2063SBarry Smith 14313a40ed3dSBarry Smith PetscFunctionBegin; 14329566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14339566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14349566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 
14359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14365c897100SBarry Smith 14375c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1438fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14395c897100SBarry Smith #else 14403447b6efSHong Zhang if (usecprow) { 14413447b6efSHong Zhang m = cprow.nrows; 14423447b6efSHong Zhang ii = cprow.i; 14437b2bb3b9SHong Zhang ridx = cprow.rindex; 14443447b6efSHong Zhang } else { 14453447b6efSHong Zhang ii = a->i; 14463447b6efSHong Zhang } 144717ab2063SBarry Smith for (i = 0; i < m; i++) { 14483447b6efSHong Zhang idx = a->j + ii[i]; 1449fff043a9SJunchao Zhang v = aa + ii[i]; 14503447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14513447b6efSHong Zhang if (usecprow) { 14527b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14533447b6efSHong Zhang } else { 145417ab2063SBarry Smith alpha = x[i]; 14553447b6efSHong Zhang } 145604fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 145717ab2063SBarry Smith } 14585c897100SBarry Smith #endif 14599566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14619566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 146417ab2063SBarry Smith } 146517ab2063SBarry Smith 1466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1467d71ae5a4SJacob Faibussowitsch { 14685c897100SBarry Smith PetscFunctionBegin; 14699566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14709566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14725c897100SBarry Smith } 14735c897100SBarry Smith 1474c6db04a5SJed Brown #include 
<../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 147578b84d54SShri Abhyankar 1476d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1477d71ae5a4SJacob Faibussowitsch { 1478416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1479d9fead3dSBarry Smith PetscScalar *y; 148054f21887SBarry Smith const PetscScalar *x; 14815914357eSBarry Smith const MatScalar *a_a; 1482003131ecSBarry Smith PetscInt m = A->rmap->n; 14835914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 1484ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 148517ab2063SBarry Smith 1486b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 148797952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1488fee21e36SBarry Smith #endif 1489fee21e36SBarry Smith 14903a40ed3dSBarry Smith PetscFunctionBegin; 1491b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14929566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1494b215bc84SStefano Zampini } 14959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14969566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14979566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1498416022c9SBarry Smith ii = a->i; 14994eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 15009566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 150197952fefSHong Zhang m = a->compressedrow.nrows; 150297952fefSHong Zhang ii = a->compressedrow.i; 150397952fefSHong Zhang ridx = a->compressedrow.rindex; 15045914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 15055914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15065914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15075914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15085914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15095914357eSBarry Smith PetscScalar sum = 0.0; 1510003131ecSBarry Smith 
PetscSparseDensePlusDot(sum, x, aa, aj, n); 1511003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 151297952fefSHong Zhang y[*ridx++] = sum; 151397952fefSHong Zhang } 151497952fefSHong Zhang } else { /* do not use compressed row format */ 1515b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15165914357eSBarry Smith fortranmultaij_(&m, x, ii, a->j, a_a, y); 1517b05257ddSBarry Smith #else 15185914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 15195914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15205914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15215914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15225914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15235914357eSBarry Smith PetscScalar sum = 0.0; 1524003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 152517ab2063SBarry Smith y[i] = sum; 152617ab2063SBarry Smith } 15278d195f9aSBarry Smith #endif 1528b05257ddSBarry Smith } 15299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15309566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15319566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 153417ab2063SBarry Smith } 153517ab2063SBarry Smith 1536ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1537ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1538d71ae5a4SJacob Faibussowitsch { 1539b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1540b434eb95SMatthew G. Knepley PetscScalar *y; 1541b434eb95SMatthew G. Knepley const PetscScalar *x; 1542fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1543b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1544b434eb95SMatthew G. 
Knepley const PetscInt *aj, *ii, *ridx = NULL; 1545b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1546b434eb95SMatthew G. Knepley PetscScalar sum; 1547b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1548b434eb95SMatthew G. Knepley 1549b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1550b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1551b434eb95SMatthew G. Knepley #endif 1552b434eb95SMatthew G. Knepley 1553b434eb95SMatthew G. Knepley PetscFunctionBegin; 15549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15559566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15569566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1557b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1558b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1559b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1560b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1561b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1562b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1563b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1564fff043a9SJunchao Zhang aa = a_a + ii[i]; 1565b434eb95SMatthew G. Knepley sum = 0.0; 1566b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1567b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1568b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1569b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15723d3eaba7SBarry Smith ii = a->i; 1573b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1574b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1575b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1576fff043a9SJunchao Zhang aa = a_a + ii[i]; 1577b434eb95SMatthew G. Knepley sum = 0.0; 1578b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1579b434eb95SMatthew G. 
Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1580b434eb95SMatthew G. Knepley y[i] = sum; 1581b434eb95SMatthew G. Knepley } 1582b434eb95SMatthew G. Knepley } 15839566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15849566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15859566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1588b434eb95SMatthew G. Knepley } 1589b434eb95SMatthew G. Knepley 1590ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1591ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1592d71ae5a4SJacob Faibussowitsch { 1593b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1594b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1595b434eb95SMatthew G. Knepley const PetscScalar *x; 1596fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1597b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1598b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1599b434eb95SMatthew G. Knepley PetscScalar sum; 1600b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1601b434eb95SMatthew G. Knepley 1602b434eb95SMatthew G. Knepley PetscFunctionBegin; 16039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16049566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16059566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1606b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 160748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1608b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1609b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1610b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1611b434eb95SMatthew G. 
Knepley for (i = 0; i < m; i++) { 1612b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1613b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1614fff043a9SJunchao Zhang aa = a_a + ii[i]; 1615b434eb95SMatthew G. Knepley sum = y[*ridx]; 1616b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1617b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1618b434eb95SMatthew G. Knepley } 1619b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16203d3eaba7SBarry Smith ii = a->i; 1621b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1622b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1623b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1624fff043a9SJunchao Zhang aa = a_a + ii[i]; 1625b434eb95SMatthew G. Knepley sum = y[i]; 1626b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1627b434eb95SMatthew G. Knepley z[i] = sum; 1628b434eb95SMatthew G. Knepley } 1629b434eb95SMatthew G. Knepley } 16309566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16319566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16329566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1635b434eb95SMatthew G. Knepley } 1636b434eb95SMatthew G. 
Knepley 1637c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1639d71ae5a4SJacob Faibussowitsch { 1640416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1641f15663dcSBarry Smith PetscScalar *y, *z; 1642f15663dcSBarry Smith const PetscScalar *x; 16435914357eSBarry Smith const MatScalar *a_a; 16445914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 16455914357eSBarry Smith PetscInt m = A->rmap->n; 1646ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16479ea0dfa2SSatish Balay 16483a40ed3dSBarry Smith PetscFunctionBegin; 1649b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16509566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1652b215bc84SStefano Zampini } 16539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16549566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16559566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16564eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 165748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 165897952fefSHong Zhang m = a->compressedrow.nrows; 165997952fefSHong Zhang ii = a->compressedrow.i; 166097952fefSHong Zhang ridx = a->compressedrow.rindex; 16615914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16625914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16635914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16645914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16655914357eSBarry Smith PetscScalar sum = y[*ridx]; 1666f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166797952fefSHong Zhang z[*ridx++] = sum; 166897952fefSHong Zhang } 166997952fefSHong Zhang } else { /* do not use compressed row format */ 16703d3eaba7SBarry Smith ii = a->i; 
1671f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16725914357eSBarry Smith fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z); 1673f15663dcSBarry Smith #else 16745914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 16755914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16765914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16775914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16785914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16795914357eSBarry Smith PetscScalar sum = y[i]; 1680f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 168117ab2063SBarry Smith z[i] = sum; 168217ab2063SBarry Smith } 168302ab625aSSatish Balay #endif 1684f15663dcSBarry Smith } 16859566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16869566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 169017ab2063SBarry Smith } 169117ab2063SBarry Smith 169217ab2063SBarry Smith /* 169317ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
169417ab2063SBarry Smith */ 1695d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1696d71ae5a4SJacob Faibussowitsch { 1697416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1698d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1699c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 170017ab2063SBarry Smith 17013a40ed3dSBarry Smith PetscFunctionBegin; 170209f38230SBarry Smith if (!a->diag) { 17039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1704c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 170509f38230SBarry Smith } 1706d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1707c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1708c0c07093SJunchao Zhang if (alreadySet) { 1709c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1710c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1711c0c07093SJunchao Zhang } 1712c0c07093SJunchao Zhang 171309f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1714bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1715bfeeae90SHong Zhang if (a->j[j] == i) { 171609f38230SBarry Smith a->diag[i] = j; 171717ab2063SBarry Smith break; 171817ab2063SBarry Smith } 171917ab2063SBarry Smith } 172017ab2063SBarry Smith } 17213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172217ab2063SBarry Smith } 172317ab2063SBarry Smith 1724ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1725d71ae5a4SJacob Faibussowitsch { 172661ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 172761ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 172861ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 172961ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 173061ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 173161ecd0c6SBarry Smith 173261ecd0c6SBarry 
Smith PetscFunctionBegin; 173361ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17359566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 173761ecd0c6SBarry Smith } 173861ecd0c6SBarry Smith 173961ecd0c6SBarry Smith if (a->diagonaldense) { 174061ecd0c6SBarry Smith cnt = 0; 174161ecd0c6SBarry Smith } else { 17429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 174361ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1744349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 174561ecd0c6SBarry Smith cnt++; 174661ecd0c6SBarry Smith mdiag[i] = 1; 174761ecd0c6SBarry Smith } 174861ecd0c6SBarry Smith } 174961ecd0c6SBarry Smith } 175061ecd0c6SBarry Smith if (!cnt) { 17519566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 175261ecd0c6SBarry Smith } else { 1753b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1754b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 17559f0612e4SBarry Smith PetscBool free_a = a->free_a, free_ij = a->free_ij; 17566ea2a7edSJunchao Zhang const PetscScalar *Aa; 17576ea2a7edSJunchao Zhang 17586ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17596ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 176061ecd0c6SBarry Smith 176161ecd0c6SBarry Smith a->a = NULL; 176261ecd0c6SBarry Smith a->j = NULL; 176361ecd0c6SBarry Smith a->i = NULL; 176461ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1765ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 
0, a->imax)); 176761ecd0c6SBarry Smith 176861ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176961ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17709566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 177148a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1772447d62f5SStefano Zampini } 17739566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17749566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 17759f0612e4SBarry Smith if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda)); 17769f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj)); 17779f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi)); 177861ecd0c6SBarry Smith } 17799566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 178061ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 178261ecd0c6SBarry Smith } 178361ecd0c6SBarry Smith 1784be5855fcSBarry Smith /* 1785be5855fcSBarry Smith Checks for missing diagonals 1786be5855fcSBarry Smith */ 1787d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1788d71ae5a4SJacob Faibussowitsch { 1789be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17907734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1791be5855fcSBarry Smith 1792be5855fcSBarry Smith PetscFunctionBegin; 179309f38230SBarry Smith *missing = PETSC_FALSE; 17947734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 179509f38230SBarry Smith *missing = PETSC_TRUE; 179609f38230SBarry Smith if (d) *d = 0; 17979566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 179809f38230SBarry Smith } else { 179901445905SHong Zhang PetscInt n; 180001445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1801f1e2ffcdSBarry Smith diag = a->diag; 180201445905SHong Zhang for (i = 0; i < n; i++) { 18037734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 180409f38230SBarry Smith *missing = PETSC_TRUE; 180509f38230SBarry Smith if (d) *d = i; 18069566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1807358d2f5dSShri Abhyankar break; 180809f38230SBarry Smith } 1809be5855fcSBarry Smith } 1810be5855fcSBarry Smith } 18113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1812be5855fcSBarry Smith } 1813be5855fcSBarry Smith 18140da83c2eSBarry Smith #include <petscblaslapack.h> 18150da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18160da83c2eSBarry Smith 18170da83c2eSBarry Smith /* 18180da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18190da83c2eSBarry Smith */ 1820ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1821d71ae5a4SJacob Faibussowitsch { 18220da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18230da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18240da83c2eSBarry Smith const PetscReal shift = 0.0; 18250da83c2eSBarry Smith PetscInt ipvt[5]; 18264e208921SJed Brown PetscCount flops = 0; 18270da83c2eSBarry Smith PetscScalar work[25], *v_work; 18280da83c2eSBarry Smith 18290da83c2eSBarry Smith PetscFunctionBegin; 18300da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18310da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 183208401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1833ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 183548a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18360da83c2eSBarry Smith ncnt = 0; 18370da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18380da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18399566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18400da83c2eSBarry Smith switch (bsizes[i]) { 1841d71ae5a4SJacob Faibussowitsch case 1: 1842d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1843d71ae5a4SJacob Faibussowitsch break; 18440da83c2eSBarry Smith case 2: 18459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18480da83c2eSBarry Smith break; 18490da83c2eSBarry Smith case 3: 18509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18510da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18530da83c2eSBarry Smith break; 18540da83c2eSBarry Smith case 4: 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18560da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18580da83c2eSBarry Smith break; 18590da83c2eSBarry Smith case 5: 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18630da83c2eSBarry Smith break; 18640da83c2eSBarry Smith case 6: 18659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18680da83c2eSBarry Smith break; 18690da83c2eSBarry Smith case 7: 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18730da83c2eSBarry Smith break; 18740da83c2eSBarry Smith default: 18759566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18760da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18779566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18780da83c2eSBarry Smith } 18790da83c2eSBarry Smith ncnt += bsizes[i]; 18800da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1881baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 18820da83c2eSBarry Smith } 18833ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 188448a46eb9SPierre 
Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18859566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18870da83c2eSBarry Smith } 18880da83c2eSBarry Smith 1889422a814eSBarry Smith /* 1890422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1891422a814eSBarry Smith */ 1892ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1893d71ae5a4SJacob Faibussowitsch { 189471f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1895d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18962e5835c6SStefano Zampini const MatScalar *v; 189754f21887SBarry Smith PetscScalar *idiag, *mdiag; 189871f1c65dSBarry Smith 189971f1c65dSBarry Smith PetscFunctionBegin; 19003ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 19019566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 190271f1c65dSBarry Smith diag = a->diag; 19034dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 19042e5835c6SStefano Zampini 190571f1c65dSBarry Smith mdiag = a->mdiag; 190671f1c65dSBarry Smith idiag = a->idiag; 19079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1908422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190971f1c65dSBarry Smith for (i = 0; i < m; i++) { 191071f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1911899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1912899639b0SHong Zhang if (PetscRealPart(fshift)) { 19139566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19147b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19157b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19167b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 191798921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1918899639b0SHong Zhang } 191971f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 192071f1c65dSBarry Smith } 19219566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 192271f1c65dSBarry Smith } else { 192371f1c65dSBarry Smith for (i = 0; i < m; i++) { 192471f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 192571f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 192671f1c65dSBarry Smith } 19279566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 192871f1c65dSBarry Smith } 192971f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 193271f1c65dSBarry Smith } 193371f1c65dSBarry Smith 1934d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1935d71ae5a4SJacob Faibussowitsch { 1936416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1937e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19382e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193954f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19403d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 194197f1f81fSBarry Smith const PetscInt *idx, *diag; 194217ab2063SBarry Smith 19433a40ed3dSBarry Smith PetscFunctionBegin; 1944b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19459566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1947b215bc84SStefano Zampini } 1948b965ef7fSBarry Smith its = its * lits; 194991723122SBarry Smith 195071f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19519566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 195271f1c65dSBarry Smith a->fshift = fshift; 195371f1c65dSBarry Smith a->omega = omega; 1954ed480e8bSBarry Smith 195571f1c65dSBarry Smith diag = a->diag; 195671f1c65dSBarry Smith t = a->ssor_work; 1957ed480e8bSBarry Smith idiag = a->idiag; 195871f1c65dSBarry Smith mdiag = a->mdiag; 1959ed480e8bSBarry Smith 19609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19619566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19629566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1963ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 196417ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 196517ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1966ed480e8bSBarry Smith bs = b; 196717ab2063SBarry Smith for (i = 0; i < m; i++) { 196871f1c65dSBarry Smith d = fshift + mdiag[i]; 1969416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1970ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19712e5835c6SStefano Zampini v = aa + diag[i] + 1; 197217ab2063SBarry Smith sum = b[i] * d / omega; 1973003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 197417ab2063SBarry Smith x[i] = sum; 197517ab2063SBarry Smith } 19769566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19799566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 198117ab2063SBarry Smith } 1982c783ea89SBarry Smith 198308401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1984f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19854c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1986887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 198717ab2063SBarry Smith 198817ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198917ab2063SBarry Smith 1990887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 199117ab2063SBarry Smith */ 199217ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 199317ab2063SBarry Smith 199417ab2063SBarry Smith /* x = (E + U)^{-1} b */ 199517ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1996416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1997ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19982e5835c6SStefano Zampini v = aa + diag[i] + 1; 199917ab2063SBarry Smith sum = b[i]; 2000e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2001ed480e8bSBarry Smith x[i] = sum * idiag[i]; 200217ab2063SBarry Smith } 200317ab2063SBarry Smith 200417ab2063SBarry Smith /* t = b - (2*E - D)x */ 20052e5835c6SStefano Zampini v = aa; 20062205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 200717ab2063SBarry Smith 200817ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2009ed480e8bSBarry Smith ts = t; 2010416022c9SBarry Smith diag = a->diag; 201117ab2063SBarry Smith for (i = 0; i < m; i++) { 2012416022c9SBarry Smith n = diag[i] - a->i[i]; 2013ed480e8bSBarry Smith idx = a->j + a->i[i]; 20142e5835c6SStefano Zampini v = aa + a->i[i]; 201517ab2063SBarry Smith sum = t[i]; 2016003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2017ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2018733d66baSBarry Smith /* x = x + t */ 2019733d66baSBarry Smith x[i] += t[i]; 202017ab2063SBarry Smith } 202117ab2063SBarry Smith 20229566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20239566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20249566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202617ab2063SBarry Smith } 202717ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 202817ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202917ab2063SBarry Smith for (i = 0; i < m; i++) { 2030416022c9SBarry Smith n = diag[i] - a->i[i]; 2031ed480e8bSBarry Smith idx = a->j + a->i[i]; 20322e5835c6SStefano Zampini v = aa + a->i[i]; 203317ab2063SBarry Smith sum = b[i]; 2034e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20355c99c7daSBarry Smith t[i] = sum; 2036ed480e8bSBarry Smith x[i] = sum * idiag[i]; 203717ab2063SBarry Smith } 20385c99c7daSBarry Smith xb = t; 20399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20403a40ed3dSBarry Smith } else xb = b; 204117ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 204217ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2043416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2044ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20452e5835c6SStefano Zampini v = aa + diag[i] + 1; 204617ab2063SBarry Smith sum = xb[i]; 2047e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20485c99c7daSBarry Smith if (xb == b) { 2049ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20505c99c7daSBarry Smith } else { 2051b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 205217ab2063SBarry Smith } 20535c99c7daSBarry Smith } 20549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 205517ab2063SBarry Smith } 205617ab2063SBarry Smith its--; 205717ab2063SBarry Smith } 205817ab2063SBarry Smith while (its--) { 205917ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 206017ab2063SBarry Smith for (i = 0; i < m; i++) { 2061b19a5dc2SMark Adams /* lower */ 2062b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2063ed480e8bSBarry Smith idx = a->j + a->i[i]; 20642e5835c6SStefano 
Zampini v = aa + a->i[i]; 206517ab2063SBarry Smith sum = b[i]; 2066e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2067b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2068b19a5dc2SMark Adams /* upper */ 2069b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2070b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20712e5835c6SStefano Zampini v = aa + diag[i] + 1; 2072b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2073b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207417ab2063SBarry Smith } 2075b19a5dc2SMark Adams xb = t; 20769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2077b19a5dc2SMark Adams } else xb = b; 207817ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2080b19a5dc2SMark Adams sum = xb[i]; 2081b19a5dc2SMark Adams if (xb == b) { 2082b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2083416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2084ed480e8bSBarry Smith idx = a->j + a->i[i]; 20852e5835c6SStefano Zampini v = aa + a->i[i]; 2086e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2087ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2088b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2089b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2090b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20912e5835c6SStefano Zampini v = aa + diag[i] + 1; 2092b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2093b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 209417ab2063SBarry Smith } 2095b19a5dc2SMark Adams } 2096b19a5dc2SMark Adams if (xb == b) { 20979566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2098b19a5dc2SMark Adams } else { 20999566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2100b19a5dc2SMark Adams } 210117ab2063SBarry Smith } 210217ab2063SBarry Smith } 21039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 21049566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 21059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 21063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 210717ab2063SBarry Smith } 210817ab2063SBarry Smith 2109ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2110d71ae5a4SJacob Faibussowitsch { 2111416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21124e220ebcSLois Curfman McInnes 21133a40ed3dSBarry Smith PetscFunctionBegin; 21144e220ebcSLois Curfman McInnes info->block_size = 1.0; 21153966268fSBarry Smith info->nz_allocated = a->maxnz; 21163966268fSBarry Smith info->nz_used = a->nz; 21173966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21183966268fSBarry Smith info->assemblies = A->num_ass; 21193966268fSBarry Smith info->mallocs = A->info.mallocs; 21204dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2121d5f3da31SBarry Smith if (A->factortype) { 21224e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21234e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21244e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21254e220ebcSLois Curfman McInnes } else { 21264e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21274e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21284e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21294e220ebcSLois Curfman McInnes } 21303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 213117ab2063SBarry Smith } 213217ab2063SBarry Smith 2133ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2134d71ae5a4SJacob Faibussowitsch { 2135416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2136c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 213797b48c8fSBarry Smith const PetscScalar *xx; 21382e5835c6SStefano Zampini PetscScalar *bb, *aa; 2139c7da8527SEric Chamberland PetscInt d = 0; 214017ab2063SBarry Smith 21413a40ed3dSBarry Smith PetscFunctionBegin; 214297b48c8fSBarry Smith if (x && b) { 21439566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21449566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 214597b48c8fSBarry Smith for (i = 0; i < N; i++) { 2146aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2147447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214897b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214997b48c8fSBarry Smith } 21509566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21519566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 215297b48c8fSBarry Smith } 215397b48c8fSBarry Smith 21549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2155a9817697SBarry Smith if (a->keepnonzeropattern) { 2156f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2157aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21589566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2159f1e2ffcdSBarry Smith } 2160f4df32b1SMatthew Knepley if (diag != 0.0) { 2161c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2162c7da8527SEric 
Chamberland d = rows[i]; 2163447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 216408401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2165c7da8527SEric Chamberland } 2166f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2167447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21682e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2169f1e2ffcdSBarry Smith } 2170f1e2ffcdSBarry Smith } 2171f1e2ffcdSBarry Smith } else { 2172f4df32b1SMatthew Knepley if (diag != 0.0) { 217317ab2063SBarry Smith for (i = 0; i < N; i++) { 2174aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21757ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2176447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2177447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2178447d62f5SStefano Zampini } else { 2179416022c9SBarry Smith a->ilen[rows[i]] = 1; 21802e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2181bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2182447d62f5SStefano Zampini } 2183447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21849566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 218517ab2063SBarry Smith } 218617ab2063SBarry Smith } 21873a40ed3dSBarry Smith } else { 218817ab2063SBarry Smith for (i = 0; i < N; i++) { 2189aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2190416022c9SBarry Smith a->ilen[rows[i]] = 0; 219117ab2063SBarry Smith } 219217ab2063SBarry Smith } 2193e56f5c9eSBarry Smith A->nonzerostate++; 2194f1e2ffcdSBarry Smith } 21959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2196dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219817ab2063SBarry Smith } 219917ab2063SBarry Smith 2200ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2201d71ae5a4SJacob Faibussowitsch { 22026e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22036e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 22042b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 22056e169961SBarry Smith const PetscScalar *xx; 22062e5835c6SStefano Zampini PetscScalar *bb, *aa; 22076e169961SBarry Smith 22086e169961SBarry Smith PetscFunctionBegin; 22093ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22116e169961SBarry Smith if (x && b) { 22129566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22139566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22142b40b63fSBarry Smith vecs = PETSC_TRUE; 22156e169961SBarry Smith } 22169566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22176e169961SBarry Smith for (i = 0; i < N; i++) { 2218aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22198e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22202205254eSKarl Rupp 22216e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22226e169961SBarry Smith } 22236e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22246e169961SBarry Smith if (!zeroed[i]) { 22256e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22264cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22272e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22282e5835c6SStefano Zampini 
aa[j] = 0.0; 22296e169961SBarry Smith } 22306e169961SBarry Smith } 22314cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22326e169961SBarry Smith } 22336e169961SBarry Smith if (x && b) { 22349566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22359566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22366e169961SBarry Smith } 22379566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22386e169961SBarry Smith if (diag != 0.0) { 22399566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22401d5a398dSstefano_zampini if (missing) { 22411d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22424cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2243aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22449566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22451d5a398dSstefano_zampini } 22461d5a398dSstefano_zampini } else { 2247ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22486e169961SBarry Smith } 22491d5a398dSstefano_zampini } 22509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2251dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22536e169961SBarry Smith } 22546e169961SBarry Smith 2255d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2256d71ae5a4SJacob Faibussowitsch { 2257fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2258fff043a9SJunchao Zhang const PetscScalar *aa; 225917ab2063SBarry Smith 22603a40ed3dSBarry Smith PetscFunctionBegin; 22619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2262416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22638e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 226417ab2063SBarry Smith if (idx) { 22655c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2266f4259b30SLisandro Dalcin else *idx = NULL; 226717ab2063SBarry Smith } 22689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227017ab2063SBarry Smith } 227117ab2063SBarry Smith 2272d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2273d71ae5a4SJacob Faibussowitsch { 22743a40ed3dSBarry Smith PetscFunctionBegin; 22753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227617ab2063SBarry Smith } 227717ab2063SBarry Smith 2278ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2279d71ae5a4SJacob Faibussowitsch { 2280416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22812e5835c6SStefano Zampini const MatScalar *v; 228236db0b34SBarry Smith PetscReal sum = 0.0; 228397f1f81fSBarry Smith PetscInt i, j; 228417ab2063SBarry Smith 22853a40ed3dSBarry Smith PetscFunctionBegin; 22869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228717ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2288570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2289570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2290792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2291570b7f6dSBarry Smith #else 2292416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22939371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22949371c9d4SSatish Balay v++; 229517ab2063SBarry Smith } 22968f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2297570b7f6dSBarry Smith #endif 22989566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22993a40ed3dSBarry Smith } else if (type == NORM_1) { 230036db0b34SBarry Smith PetscReal *tmp; 230197f1f81fSBarry Smith PetscInt *jj = a->j; 23029566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2303064f8208SBarry Smith *nrm = 0.0; 2304416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 23059371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23069371c9d4SSatish Balay v++; 230717ab2063SBarry Smith } 2308d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2309064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 231017ab2063SBarry Smith } 23119566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23133a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2314064f8208SBarry Smith *nrm = 0.0; 2315d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23168e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 231717ab2063SBarry Smith sum = 0.0; 2318416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23199371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23209371c9d4SSatish Balay v2++; 232117ab2063SBarry Smith } 2322064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 232317ab2063SBarry Smith } 23249566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2325f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232817ab2063SBarry Smith } 232917ab2063SBarry Smith 2330ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2331d71ae5a4SJacob Faibussowitsch { 23323d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 233354f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23342e5835c6SStefano Zampini const MatScalar *va, *vb; 233597f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2336cd0d46ebSvictorle 2337cd0d46ebSvictorle PetscFunctionBegin; 23389566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23399566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23405485867bSBarry Smith if (ma != nb || na != mb) { 23415485867bSBarry Smith *f = PETSC_FALSE; 23423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23435485867bSBarry Smith } 23449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23469371c9d4SSatish Balay aii = aij->i; 23479371c9d4SSatish Balay bii = bij->i; 23489371c9d4SSatish Balay adx = aij->j; 23499371c9d4SSatish Balay bdx = bij->j; 23509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2352cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2353cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2354cd0d46ebSvictorle 2355cd0d46ebSvictorle *f = PETSC_TRUE; 2356cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2357cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 235897f1f81fSBarry Smith PetscInt idc, idr; 23595485867bSBarry Smith PetscScalar vc, vr; 2360cd0d46ebSvictorle /* column/row index/value */ 23615485867bSBarry Smith idc = adx[aptr[i]]; 23625485867bSBarry Smith idr = bdx[bptr[idc]]; 23635485867bSBarry Smith vc = va[aptr[i]]; 23645485867bSBarry Smith vr = vb[bptr[idc]]; 23655485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23665485867bSBarry Smith *f = PETSC_FALSE; 23675485867bSBarry Smith goto done; 2368cd0d46ebSvictorle } else { 23695485867bSBarry Smith aptr[i]++; 23705485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2371cd0d46ebSvictorle } 2372cd0d46ebSvictorle } 2373cd0d46ebSvictorle } 2374cd0d46ebSvictorle done: 23759566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23769566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2380cd0d46ebSvictorle } 2381cd0d46ebSvictorle 2382ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2383d71ae5a4SJacob Faibussowitsch { 23843d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 238554f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238654f21887SBarry Smith MatScalar *va, *vb; 23871cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23881cbb95d3SBarry Smith 23891cbb95d3SBarry Smith PetscFunctionBegin; 23909566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23919566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23921cbb95d3SBarry Smith if (ma != nb || na != mb) { 23931cbb95d3SBarry Smith *f = PETSC_FALSE; 23943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23951cbb95d3SBarry Smith } 23969371c9d4SSatish Balay aii = aij->i; 23979371c9d4SSatish Balay bii = bij->i; 23989371c9d4SSatish Balay adx = aij->j; 23999371c9d4SSatish Balay bdx = bij->j; 24009371c9d4SSatish Balay va = aij->a; 24019371c9d4SSatish Balay vb = bij->a; 24029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 24039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 24041cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 24051cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24061cbb95d3SBarry Smith 24071cbb95d3SBarry Smith *f = PETSC_TRUE; 24081cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24091cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24101cbb95d3SBarry Smith PetscInt idc, idr; 24111cbb95d3SBarry Smith PetscScalar vc, vr; 24121cbb95d3SBarry 
Smith /* column/row index/value */ 24131cbb95d3SBarry Smith idc = adx[aptr[i]]; 24141cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24151cbb95d3SBarry Smith vc = va[aptr[i]]; 24161cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24171cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24181cbb95d3SBarry Smith *f = PETSC_FALSE; 24191cbb95d3SBarry Smith goto done; 24201cbb95d3SBarry Smith } else { 24211cbb95d3SBarry Smith aptr[i]++; 24221cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24231cbb95d3SBarry Smith } 24241cbb95d3SBarry Smith } 24251cbb95d3SBarry Smith } 24261cbb95d3SBarry Smith done: 24279566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24289566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24301cbb95d3SBarry Smith } 24311cbb95d3SBarry Smith 2432d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2433d71ae5a4SJacob Faibussowitsch { 2434416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2435fff8e43fSBarry Smith const PetscScalar *l, *r; 2436fff8e43fSBarry Smith PetscScalar x; 243754f21887SBarry Smith MatScalar *v; 2438fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2439fff8e43fSBarry Smith const PetscInt *jj; 244017ab2063SBarry Smith 24413a40ed3dSBarry Smith PetscFunctionBegin; 244217ab2063SBarry Smith if (ll) { 24433ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24443ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24459566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244608401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24479566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244917ab2063SBarry Smith for (i = 0; i < m; i++) { 245017ab2063SBarry Smith x = 
l[i]; 2451416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24522205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 245317ab2063SBarry Smith } 24549566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24559566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245717ab2063SBarry Smith } 245817ab2063SBarry Smith if (rr) { 24599566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 246008401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24619566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24632e5835c6SStefano Zampini jj = a->j; 24642205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24669566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24679566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246817ab2063SBarry Smith } 24699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 247117ab2063SBarry Smith } 247217ab2063SBarry Smith 2473d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2474d71ae5a4SJacob Faibussowitsch { 2475db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2476d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247797f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24785d0c19d7SBarry Smith const PetscInt *irow, *icol; 24792e5835c6SStefano Zampini const PetscScalar *aa; 24805d0c19d7SBarry Smith PetscInt nrows, ncols; 248197f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = 
a->ilen; 2482fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2483416022c9SBarry Smith Mat C; 2484cdc6f3adSToby Isaac PetscBool stride; 248517ab2063SBarry Smith 24863a40ed3dSBarry Smith PetscFunctionBegin; 24879566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24889566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24899566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 249017ab2063SBarry Smith 24919566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2492ff718158SBarry Smith if (stride) { 24939566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2494ff718158SBarry Smith } else { 2495ff718158SBarry Smith first = 0; 2496ff718158SBarry Smith step = 0; 2497ff718158SBarry Smith } 2498fee21e36SBarry Smith if (stride && step == 1) { 249902834360SBarry Smith /* special case of contiguous rows */ 25009566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 250102834360SBarry Smith /* loop over new rows determining lens and starting points */ 250202834360SBarry Smith for (i = 0; i < nrows; i++) { 2503bfeeae90SHong Zhang kstart = ai[irow[i]]; 2504a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2505a91a9bebSLisandro Dalcin starts[i] = kstart; 250602834360SBarry Smith for (k = kstart; k < kend; k++) { 2507bfeeae90SHong Zhang if (aj[k] >= first) { 250802834360SBarry Smith starts[i] = k; 250902834360SBarry Smith break; 251002834360SBarry Smith } 251102834360SBarry Smith } 2512a2744918SBarry Smith sum = 0; 251302834360SBarry Smith while (k < kend) { 2514bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2515a2744918SBarry Smith sum++; 251602834360SBarry Smith } 2517a2744918SBarry Smith lens[i] = sum; 251802834360SBarry Smith } 251902834360SBarry Smith /* create submatrix */ 2520cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 252197f1f81fSBarry Smith PetscInt n_cols, n_rows; 25229566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2523aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25249566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 252508480c60SBarry Smith C = *B; 25263a40ed3dSBarry Smith } else { 25273bef6203SJed Brown PetscInt rbs, cbs; 25289566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25309566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25319566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25329566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25339566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 253508480c60SBarry Smith } 2536db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2537db02288aSLois Curfman McInnes 253802834360SBarry Smith /* loop over rows inserting into submatrix */ 2539fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2540db02288aSLois Curfman McInnes j_new = c->j; 2541db02288aSLois Curfman McInnes i_new = c->i; 25429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 254302834360SBarry Smith for (i = 0; i < nrows; i++) { 2544a2744918SBarry Smith ii = starts[i]; 2545a2744918SBarry Smith lensi = lens[i]; 2546810441c8SPierre Jolivet if (lensi) { 2547ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2549a2744918SBarry Smith a_new += lensi; 2550810441c8SPierre Jolivet } 2551a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2552a2744918SBarry 
Smith c->ilen[i] = lensi; 255302834360SBarry Smith } 2554fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25569566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25573a40ed3dSBarry Smith } else { 25589566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25599566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25614dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25626bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25634dcab191SBarry Smith smap[icol[i]] = i + 1; 25644dcab191SBarry Smith } 25654dcab191SBarry Smith 256602834360SBarry Smith /* determine lens of each row */ 256702834360SBarry Smith for (i = 0; i < nrows; i++) { 2568bfeeae90SHong Zhang kstart = ai[irow[i]]; 256902834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 257002834360SBarry Smith lens[i] = 0; 257102834360SBarry Smith for (k = kstart; k < kend; k++) { 2572ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 257302834360SBarry Smith } 257402834360SBarry Smith } 257517ab2063SBarry Smith /* Create and fill new matrix */ 2576a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2577ace3abfcSBarry Smith PetscBool equal; 25780f5bd95cSBarry Smith 257999141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2580aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25819566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2582fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. 
wrong number of nonzeros"); 25839566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 258408480c60SBarry Smith C = *B; 25853a40ed3dSBarry Smith } else { 25863bef6203SJed Brown PetscInt rbs, cbs; 25879566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25889566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25899566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25909566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 259137a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25929566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 259408480c60SBarry Smith } 25959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2596fb3c7e2dSJunchao Zhang 2597f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2598fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 259917ab2063SBarry Smith for (i = 0; i < nrows; i++) { 260099141d43SSatish Balay row = irow[i]; 2601bfeeae90SHong Zhang kstart = ai[row]; 260299141d43SSatish Balay kend = kstart + a->ilen[row]; 2603bfeeae90SHong Zhang mat_i = c->i[i]; 26048e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26058e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 260699141d43SSatish Balay mat_ilen = c->ilen + i; 260717ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2608bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2609ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26102e5835c6SStefano Zampini *mat_a++ = aa[k]; 261199141d43SSatish Balay (*mat_ilen)++; 261217ab2063SBarry Smith } 261317ab2063SBarry Smith } 261417ab2063SBarry Smith } 26159566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 261602834360SBarry Smith /* Free work space */ 26179566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26189566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26199566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2620cdc6f3adSToby Isaac /* sort */ 2621cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2622cdc6f3adSToby Isaac PetscInt ilen; 2623cdc6f3adSToby Isaac 2624cdc6f3adSToby Isaac mat_i = c->i[i]; 26258e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26268e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2627cdc6f3adSToby Isaac ilen = c->ilen[i]; 26289566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2629cdc6f3adSToby Isaac } 2630fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 263102834360SBarry Smith } 26328c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26339566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2634305c6ccfSStefano Zampini #endif 26359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 263717ab2063SBarry Smith 26389566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2639416022c9SBarry Smith *B = C; 26403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 264117ab2063SBarry Smith } 264217ab2063SBarry Smith 2643ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2644d71ae5a4SJacob Faibussowitsch { 264582d44351SHong Zhang Mat B; 264682d44351SHong Zhang 264782d44351SHong Zhang PetscFunctionBegin; 2648c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26499566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26509566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, 
mat->rmap->n, mat->cmap->n)); 26519566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26529566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26539566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 265482d44351SHong Zhang *subMat = B; 2655c2d650bdSHong Zhang } else { 26569566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2657c2d650bdSHong Zhang } 26583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265982d44351SHong Zhang } 266082d44351SHong Zhang 2661ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2662d71ae5a4SJacob Faibussowitsch { 266363b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 266463b91edcSBarry Smith Mat outA; 2665ace3abfcSBarry Smith PetscBool row_identity, col_identity; 266663b91edcSBarry Smith 26673a40ed3dSBarry Smith PetscFunctionBegin; 266808401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26691df811f5SHong Zhang 26709566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26719566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2672a871dcd8SBarry Smith 267363b91edcSBarry Smith outA = inA; 2674d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26759566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26769566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26772205254eSKarl Rupp 26789566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26799566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26802205254eSKarl Rupp 2681c3122656SLisandro Dalcin a->row = row; 26822205254eSKarl Rupp 26839566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26849566063dSJacob Faibussowitsch 
PetscCall(ISDestroy(&a->col)); 26852205254eSKarl Rupp 2686c3122656SLisandro Dalcin a->col = col; 268763b91edcSBarry Smith 268836db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26899566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26909566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2691f0ec6fceSSatish Balay 269294a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 269494a9d846SBarry Smith } 269563b91edcSBarry Smith 26969566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2697137fb511SHong Zhang if (row_identity && col_identity) { 26989566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2699137fb511SHong Zhang } else { 27009566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2701137fb511SHong Zhang } 27023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2703a871dcd8SBarry Smith } 2704a871dcd8SBarry Smith 2705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2706d71ae5a4SJacob Faibussowitsch { 2707f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2708dfa0f9e5SStefano Zampini PetscScalar *v; 2709c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27103a40ed3dSBarry Smith 27113a40ed3dSBarry Smith PetscFunctionBegin; 27129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27139566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2714792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27159566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 
27183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2719f0b747eeSBarry Smith } 2720f0b747eeSBarry Smith 2721d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2722d71ae5a4SJacob Faibussowitsch { 272316b64355SHong Zhang PetscInt i; 272416b64355SHong Zhang 272516b64355SHong Zhang PetscFunctionBegin; 272616b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27279566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 272816b64355SHong Zhang 272948a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27309566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 273116b64355SHong Zhang 273216b64355SHong Zhang if (submatj->rbuf1) { 27339566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 273516b64355SHong Zhang } 273616b64355SHong Zhang 273748a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27389566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27399566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 274016b64355SHong Zhang } 274116b64355SHong Zhang 274216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2743eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27449566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27459566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 274616b64355SHong Zhang #else 27479566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 274816b64355SHong Zhang #endif 274916b64355SHong Zhang 275016b64355SHong Zhang if (!submatj->allcolumns) { 275116b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 
2752835f2295SStefano Zampini PetscCall(PetscHMapIDestroy(&submatj->cmap)); 275316b64355SHong Zhang #else 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 275516b64355SHong Zhang #endif 275616b64355SHong Zhang } 27579566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 275816b64355SHong Zhang 27599566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276116b64355SHong Zhang } 276216b64355SHong Zhang 2763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2764d71ae5a4SJacob Faibussowitsch { 276516b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27665c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 276716b64355SHong Zhang 276816b64355SHong Zhang PetscFunctionBegin; 27699566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27709566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 277216b64355SHong Zhang } 277316b64355SHong Zhang 277489a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2775ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2776d71ae5a4SJacob Faibussowitsch { 27772d033e1fSHong Zhang PetscInt i; 27780fb991dcSHong Zhang Mat C; 27790fb991dcSHong Zhang Mat_SeqAIJ *c; 27800fb991dcSHong Zhang Mat_SubSppt *submatj; 27812d033e1fSHong Zhang 27822d033e1fSHong Zhang PetscFunctionBegin; 27832d033e1fSHong Zhang for (i = 0; i < n; i++) { 27840fb991dcSHong Zhang C = (*mat)[i]; 27850fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27860fb991dcSHong Zhang submatj = c->submatis1; 27872d033e1fSHong Zhang if (submatj) { 2788682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278926cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27909566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 
27919566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27929566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27933faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27949566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27959566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27969566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2797682e4c99SStefano Zampini } 27982d033e1fSHong Zhang } else { 27999566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28002d033e1fSHong Zhang } 28012d033e1fSHong Zhang } 280286e85357SHong Zhang 280363a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28049566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 280563a75b2aSHong Zhang 28069566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28082d033e1fSHong Zhang } 28092d033e1fSHong Zhang 2810ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2811d71ae5a4SJacob Faibussowitsch { 281297f1f81fSBarry Smith PetscInt i; 2813cddf8d76SBarry Smith 28143a40ed3dSBarry Smith PetscFunctionBegin; 281548a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2816cddf8d76SBarry Smith 281748a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2819cddf8d76SBarry Smith } 2820cddf8d76SBarry Smith 2821ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2822d71ae5a4SJacob Faibussowitsch { 2823e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28249a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, 
isz, val; 28255d0c19d7SBarry Smith const PetscInt *idx; 28269a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2827f1af5d2fSBarry Smith PetscBT table; 2828bbd702dbSSatish Balay 28293a40ed3dSBarry Smith PetscFunctionBegin; 28309a88ca10SBarry Smith m = A->rmap->n / bs; 2831e4d965acSSatish Balay ai = a->i; 2832bfeeae90SHong Zhang aj = a->j; 28338a047759SSatish Balay 283408401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 283506763907SSatish Balay 28369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28379566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 283806763907SSatish Balay 2839e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2840b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2841e4d965acSSatish Balay isz = 0; 28429566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2843e4d965acSSatish Balay 2844e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28459566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28469566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2847e4d965acSSatish Balay 28489a88ca10SBarry Smith if (bs > 1) { 28499a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28509a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28519a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28529a88ca10SBarry Smith } 28539a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28549a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28559a88ca10SBarry Smith 28569a88ca10SBarry Smith k = 0; 28579a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28589a88ca10SBarry Smith n = isz; 28599a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28609a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28619a88ca10SBarry Smith row = bs * nidx[k] + ll; 28629a88ca10SBarry Smith start = ai[row]; 28639a88ca10SBarry Smith end = ai[row + 1]; 28649a88ca10SBarry Smith for (l = start; l < end; l++) { 28659a88ca10SBarry Smith val = aj[l] / bs; 28669a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28679a88ca10SBarry Smith } 28689a88ca10SBarry Smith } 28699a88ca10SBarry Smith } 28709a88ca10SBarry Smith } 287157508eceSPierre Jolivet PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i)); 28729a88ca10SBarry Smith } else { 2873dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2874e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28752205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28764dcbc457SBarry Smith } 28779566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28789566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2879e4d965acSSatish Balay 288004a348a9SBarry Smith k = 0; 288104a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 288204a348a9SBarry Smith n = isz; 288306763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2884e4d965acSSatish Balay row = nidx[k]; 2885e4d965acSSatish Balay start = ai[row]; 2886e4d965acSSatish Balay end = ai[row + 1]; 288704a348a9SBarry Smith for (l = start; l < end; l++) { 2888efb16452SHong Zhang val = aj[l]; 28892205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2890e4d965acSSatish Balay } 2891e4d965acSSatish Balay } 2892e4d965acSSatish Balay } 289357508eceSPierre Jolivet PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i)); 2894e4d965acSSatish Balay } 28959a88ca10SBarry Smith } 28969566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28979566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28994dcbc457SBarry Smith } 290017ab2063SBarry Smith 2901ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2902d71ae5a4SJacob Faibussowitsch { 29030513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29043b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29055d0c19d7SBarry Smith const PetscInt *row, *col; 29065d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 290756cd22aeSBarry Smith IS icolp, irowp; 29080298fd71SBarry Smith PetscInt *cwork = NULL; 29090298fd71SBarry Smith PetscScalar *vwork = NULL; 29100513a670SBarry Smith 
29113a40ed3dSBarry Smith PetscFunctionBegin; 29129566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29139566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29149566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29159566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29160513a670SBarry Smith 29170513a670SBarry Smith /* determine lengths of permuted rows */ 29189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29192205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29209566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29219566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29229566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29239566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29259566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29260513a670SBarry Smith 29279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29280513a670SBarry Smith for (i = 0; i < m; i++) { 29299566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29302205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29319566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29329566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29330513a670SBarry Smith } 29349566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29352205254eSKarl Rupp 29363c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29372205254eSKarl Rupp 29388c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29399566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29409fe5e383SStefano Zampini #endif 
29419566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29429566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29439566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29449566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29459566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29469566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 294748a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29490513a670SBarry Smith } 29500513a670SBarry Smith 2951d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2952d71ae5a4SJacob Faibussowitsch { 2953cb5b572fSBarry Smith PetscFunctionBegin; 295433f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 295533f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2956be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2957be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29582e5835c6SStefano Zampini const PetscScalar *aa; 2959be6bf707SBarry Smith 29609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 296108401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29639566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2965cb5b572fSBarry Smith } else { 29669566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2967cb5b572fSBarry Smith } 29683ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2969cb5b572fSBarry Smith } 2970cb5b572fSBarry Smith 2971d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2972d71ae5a4SJacob Faibussowitsch { 29736c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29746e111a19SKarl Rupp 29756c0721eeSBarry Smith PetscFunctionBegin; 29766c0721eeSBarry Smith *array = a->a; 29773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29786c0721eeSBarry Smith } 29796c0721eeSBarry Smith 2980d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2981d71ae5a4SJacob Faibussowitsch { 29826c0721eeSBarry Smith PetscFunctionBegin; 2983f38c1e66SStefano Zampini *array = NULL; 29843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29856c0721eeSBarry Smith } 2986273d9f13SBarry Smith 29878229c054SShri Abhyankar /* 29888229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29898229c054SShri Abhyankar have different nonzero structure. 
29908229c054SShri Abhyankar */ 2991d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2992d71ae5a4SJacob Faibussowitsch { 2993b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2994ec7775f6SShri Abhyankar 2995ec7775f6SShri Abhyankar PetscFunctionBegin; 2996ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2997ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29988e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2999b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3000b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30018af7cee1SJed Brown nnz[i] = 0; 30028af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3003b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3004b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30058af7cee1SJed Brown nnz[i]++; 30068af7cee1SJed Brown } 30078af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3008ec7775f6SShri Abhyankar } 30093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3010ec7775f6SShri Abhyankar } 3011ec7775f6SShri Abhyankar 3012d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3013d71ae5a4SJacob Faibussowitsch { 3014b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3015b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3016b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3017b264fe52SHong Zhang 3018b264fe52SHong Zhang PetscFunctionBegin; 3019b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30209566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3022b264fe52SHong Zhang } 
3023b264fe52SHong Zhang 3024d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3025d71ae5a4SJacob Faibussowitsch { 3026ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3027ac90fabeSBarry Smith 3028ac90fabeSBarry Smith PetscFunctionBegin; 3029134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3030134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3031134adf20SPierre Jolivet if (e) { 30329566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 303381fa06acSBarry Smith if (e) { 30349566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3035134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303681fa06acSBarry Smith } 303781fa06acSBarry Smith } 303854c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303981fa06acSBarry Smith } 3040ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30412e5835c6SStefano Zampini const PetscScalar *xa; 30422e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 304381fa06acSBarry Smith PetscBLASInt one = 1, bnz; 304481fa06acSBarry Smith 30459566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3048792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30519566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30539566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3054ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30559566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3056ac90fabeSBarry Smith } else { 30578229c054SShri Abhyankar Mat B; 30588229c054SShri Abhyankar PetscInt *nnz; 30599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30609566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30619566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30629566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30639566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30649566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30669566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30679566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30689bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30699566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3070ac90fabeSBarry Smith } 30713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3072ac90fabeSBarry Smith } 3073ac90fabeSBarry Smith 3074d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3075d71ae5a4SJacob Faibussowitsch { 3076354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3077354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3078354c94deSBarry Smith PetscInt i, nz; 3079354c94deSBarry Smith PetscScalar *a; 3080354c94deSBarry Smith 3081354c94deSBarry Smith PetscFunctionBegin; 3082354c94deSBarry Smith nz = aij->nz; 30839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30842205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3086354c94deSBarry Smith #else 3087354c94deSBarry Smith PetscFunctionBegin; 3088354c94deSBarry Smith #endif 30893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3090354c94deSBarry Smith } 3091354c94deSBarry Smith 3092ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3093d71ae5a4SJacob Faibussowitsch { 3094e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3095d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3096e34fafa9SBarry Smith PetscReal atmp; 3097985db425SBarry Smith PetscScalar *x; 3098ce496241SStefano Zampini const MatScalar *aa, *av; 3099e34fafa9SBarry Smith 3100e34fafa9SBarry Smith PetscFunctionBegin; 310128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3103ce496241SStefano Zampini aa = av; 3104e34fafa9SBarry Smith ai = a->i; 3105e34fafa9SBarry Smith aj = a->j; 3106e34fafa9SBarry Smith 31079566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31089566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31099566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3111e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31129371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31139371c9d4SSatish Balay ai++; 3114e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3115985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31169371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31179371c9d4SSatish Balay x[i] = atmp; 31189371c9d4SSatish Balay if (idx) idx[i] = *aj; 31199371c9d4SSatish Balay } 31209371c9d4SSatish Balay aa++; 31219371c9d4SSatish Balay aj++; 3122985db425SBarry Smith } 3123985db425SBarry 
Smith } 31249566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3127985db425SBarry Smith } 3128985db425SBarry Smith 3129eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3130eede4a3fSMark Adams { 3131eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3132eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3133eede4a3fSMark Adams PetscScalar *x; 3134eede4a3fSMark Adams const MatScalar *aa, *av; 3135eede4a3fSMark Adams 3136eede4a3fSMark Adams PetscFunctionBegin; 3137eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3138eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3139eede4a3fSMark Adams aa = av; 3140eede4a3fSMark Adams ai = a->i; 3141eede4a3fSMark Adams 3142eede4a3fSMark Adams PetscCall(VecSet(v, 0.0)); 3143eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3144eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3145eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3146eede4a3fSMark Adams for (i = 0; i < m; i++) { 3147eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3148eede4a3fSMark Adams ai++; 3149eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3150eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3151eede4a3fSMark Adams aa++; 3152eede4a3fSMark Adams } 3153eede4a3fSMark Adams } 3154eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3155eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3156eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3157eede4a3fSMark Adams } 3158eede4a3fSMark Adams 3159ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3160d71ae5a4SJacob Faibussowitsch { 3161985db425SBarry Smith Mat_SeqAIJ *a 
= (Mat_SeqAIJ *)A->data; 3162d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3163985db425SBarry Smith PetscScalar *x; 3164ce496241SStefano Zampini const MatScalar *aa, *av; 3165985db425SBarry Smith 3166985db425SBarry Smith PetscFunctionBegin; 316728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3169ce496241SStefano Zampini aa = av; 3170985db425SBarry Smith ai = a->i; 3171985db425SBarry Smith aj = a->j; 3172985db425SBarry Smith 31739566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31759566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 317608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3177985db425SBarry Smith for (i = 0; i < m; i++) { 31789371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31799371c9d4SSatish Balay ai++; 3180d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31819371c9d4SSatish Balay x[i] = *aa; 31829371c9d4SSatish Balay if (idx) idx[i] = 0; 3183985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3184985db425SBarry Smith x[i] = 0.0; 3185985db425SBarry Smith if (idx) { 3186985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3187985db425SBarry Smith if (aj[j] > j) { 3188985db425SBarry Smith idx[i] = j; 3189985db425SBarry Smith break; 3190985db425SBarry Smith } 3191985db425SBarry Smith } 31921a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31931a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3194985db425SBarry Smith } 3195985db425SBarry Smith } 3196985db425SBarry Smith for (j = 0; j < ncols; j++) { 31979371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) 
{ 31989371c9d4SSatish Balay x[i] = *aa; 31999371c9d4SSatish Balay if (idx) idx[i] = *aj; 32009371c9d4SSatish Balay } 32019371c9d4SSatish Balay aa++; 32029371c9d4SSatish Balay aj++; 3203985db425SBarry Smith } 3204985db425SBarry Smith } 32059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3208985db425SBarry Smith } 3209985db425SBarry Smith 3210ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3211d71ae5a4SJacob Faibussowitsch { 3212c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3213c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3214ce496241SStefano Zampini PetscScalar *x; 3215ce496241SStefano Zampini const MatScalar *aa, *av; 3216c87e5d42SMatthew Knepley 3217c87e5d42SMatthew Knepley PetscFunctionBegin; 32189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3219ce496241SStefano Zampini aa = av; 3220c87e5d42SMatthew Knepley ai = a->i; 3221c87e5d42SMatthew Knepley aj = a->j; 3222c87e5d42SMatthew Knepley 32239566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32249566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32259566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 322608401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3227c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32289371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32299371c9d4SSatish Balay ai++; 3230f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32319371c9d4SSatish Balay x[i] = *aa; 32329371c9d4SSatish Balay if (idx) idx[i] = 0; 3233f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3234f07e67edSHong Zhang x[i] = 0.0; 3235f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3236289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3237f07e67edSHong Zhang if (aj[j] > j) { 3238f07e67edSHong Zhang idx[i] = j; 32392205254eSKarl Rupp break; 32402205254eSKarl Rupp } 3241289a08f5SMatthew Knepley } 3242f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3243f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3244f07e67edSHong Zhang } 3245289a08f5SMatthew Knepley } 3246c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32479371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32489371c9d4SSatish Balay x[i] = *aa; 32499371c9d4SSatish Balay if (idx) idx[i] = *aj; 32509371c9d4SSatish Balay } 32519371c9d4SSatish Balay aa++; 32529371c9d4SSatish Balay aj++; 3253c87e5d42SMatthew Knepley } 3254c87e5d42SMatthew Knepley } 32559566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3258c87e5d42SMatthew Knepley } 3259c87e5d42SMatthew Knepley 3260ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3261d71ae5a4SJacob Faibussowitsch { 3262985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3263d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3264d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3265985db425SBarry Smith PetscScalar *x; 
3266ce496241SStefano Zampini const MatScalar *aa, *av; 3267985db425SBarry Smith 3268985db425SBarry Smith PetscFunctionBegin; 326928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3271ce496241SStefano Zampini aa = av; 3272985db425SBarry Smith ai = a->i; 3273985db425SBarry Smith aj = a->j; 3274985db425SBarry Smith 32759566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32769566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32779566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 327808401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3279985db425SBarry Smith for (i = 0; i < m; i++) { 32809371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32819371c9d4SSatish Balay ai++; 3282d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32839371c9d4SSatish Balay x[i] = *aa; 32849371c9d4SSatish Balay if (idx) idx[i] = 0; 3285985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3286985db425SBarry Smith x[i] = 0.0; 3287985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3288985db425SBarry Smith for (j = 0; j < ncols; j++) { 3289985db425SBarry Smith if (aj[j] > j) { 3290985db425SBarry Smith idx[i] = j; 3291985db425SBarry Smith break; 3292985db425SBarry Smith } 3293985db425SBarry Smith } 3294fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3295fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3296985db425SBarry Smith } 3297985db425SBarry Smith } 3298985db425SBarry Smith for (j = 0; j < ncols; j++) { 32999371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 33009371c9d4SSatish Balay x[i] = *aa; 33019371c9d4SSatish Balay if (idx) idx[i] = *aj; 33029371c9d4SSatish Balay } 33039371c9d4SSatish Balay aa++; 
33049371c9d4SSatish Balay aj++; 3305e34fafa9SBarry Smith } 3306e34fafa9SBarry Smith } 33079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 33089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 33093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3310e34fafa9SBarry Smith } 3311bbead8a2SBarry Smith 3312ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3313d71ae5a4SJacob Faibussowitsch { 3314bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 331533d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3316bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33170da83c2eSBarry Smith const PetscReal shift = 0.0; 33181a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3319bbead8a2SBarry Smith 3320bbead8a2SBarry Smith PetscFunctionBegin; 3321a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33224a0d0026SBarry Smith if (a->ibdiagvalid) { 33234a0d0026SBarry Smith if (values) *values = a->ibdiag; 33243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33254a0d0026SBarry Smith } 33269566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33274dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3328bbead8a2SBarry Smith diag = a->ibdiag; 3329bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3330bbead8a2SBarry Smith /* factor and invert each block */ 3331bbead8a2SBarry Smith switch (bs) { 3332bbead8a2SBarry Smith case 1: 3333bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3335ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3336ec1892c8SHong Zhang if (allowzeropivot) { 33377b6c816cSBarry Smith A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 33387b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33397b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 334198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3342ec1892c8SHong Zhang } 3343bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3344bbead8a2SBarry Smith } 3345bbead8a2SBarry Smith break; 3346bbead8a2SBarry Smith case 2: 3347bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33489371c9d4SSatish Balay ij[0] = 2 * i; 33499371c9d4SSatish Balay ij[1] = 2 * i + 1; 33509566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33527b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3354bbead8a2SBarry Smith diag += 4; 3355bbead8a2SBarry Smith } 3356bbead8a2SBarry Smith break; 3357bbead8a2SBarry Smith case 3: 3358bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33599371c9d4SSatish Balay ij[0] = 3 * i; 33609371c9d4SSatish Balay ij[1] = 3 * i + 1; 33619371c9d4SSatish Balay ij[2] = 3 * i + 2; 33629566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33647b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33659566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3366bbead8a2SBarry Smith diag += 9; 3367bbead8a2SBarry Smith } 3368bbead8a2SBarry Smith break; 3369bbead8a2SBarry Smith case 4: 3370bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33719371c9d4SSatish Balay ij[0] = 4 * i; 33729371c9d4SSatish Balay ij[1] = 4 * i + 1; 33739371c9d4SSatish Balay ij[2] = 4 * i + 2; 33749371c9d4SSatish Balay ij[3] = 4 * i + 3; 33759566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33769566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33777b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33789566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3379bbead8a2SBarry Smith diag += 16; 3380bbead8a2SBarry Smith } 3381bbead8a2SBarry Smith break; 3382bbead8a2SBarry Smith case 5: 3383bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33849371c9d4SSatish Balay ij[0] = 5 * i; 33859371c9d4SSatish Balay ij[1] = 5 * i + 1; 33869371c9d4SSatish Balay ij[2] = 5 * i + 2; 33879371c9d4SSatish Balay ij[3] = 5 * i + 3; 33889371c9d4SSatish Balay ij[4] = 5 * i + 4; 33899566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33909566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33917b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33929566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3393bbead8a2SBarry Smith diag += 25; 3394bbead8a2SBarry Smith } 3395bbead8a2SBarry Smith break; 3396bbead8a2SBarry Smith case 6: 3397bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33989371c9d4SSatish Balay ij[0] = 6 * i; 33999371c9d4SSatish Balay ij[1] = 6 * i + 1; 34009371c9d4SSatish Balay ij[2] = 6 * i + 2; 34019371c9d4SSatish Balay ij[3] = 6 * i + 3; 34029371c9d4SSatish Balay ij[4] = 
6 * i + 4; 34039371c9d4SSatish Balay ij[5] = 6 * i + 5; 34049566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 34067b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34079566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3408bbead8a2SBarry Smith diag += 36; 3409bbead8a2SBarry Smith } 3410bbead8a2SBarry Smith break; 3411bbead8a2SBarry Smith case 7: 3412bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34139371c9d4SSatish Balay ij[0] = 7 * i; 34149371c9d4SSatish Balay ij[1] = 7 * i + 1; 34159371c9d4SSatish Balay ij[2] = 7 * i + 2; 34169371c9d4SSatish Balay ij[3] = 7 * i + 3; 34179371c9d4SSatish Balay ij[4] = 7 * i + 4; 34189371c9d4SSatish Balay ij[5] = 7 * i + 5; 3419cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34209566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34219566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34227b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34239566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3424bbead8a2SBarry Smith diag += 49; 3425bbead8a2SBarry Smith } 3426bbead8a2SBarry Smith break; 3427bbead8a2SBarry Smith default: 34289566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3429bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3430ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34319566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34337b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3435bbead8a2SBarry Smith diag += bs2; 3436bbead8a2SBarry Smith } 34379566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3438bbead8a2SBarry Smith } 3439bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3441bbead8a2SBarry Smith } 3442bbead8a2SBarry Smith 3443d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3444d71ae5a4SJacob Faibussowitsch { 344573a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3446fff043a9SJunchao Zhang PetscScalar a, *aa; 344773a71a0fSBarry Smith PetscInt m, n, i, j, col; 344873a71a0fSBarry Smith 344973a71a0fSBarry Smith PetscFunctionBegin; 345073a71a0fSBarry Smith if (!x->assembled) { 34519566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 345273a71a0fSBarry Smith for (i = 0; i < m; i++) { 345373a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34549566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 345573a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34569566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 345773a71a0fSBarry Smith } 345873a71a0fSBarry Smith } 3459e2ce353bSJunchao Zhang } else { 34609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34619566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3463e2ce353bSJunchao Zhang } 34649566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34659566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 346773a71a0fSBarry Smith } 346873a71a0fSBarry Smith 3469679944adSJunchao 
Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3470d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3471d71ae5a4SJacob Faibussowitsch { 3472679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3473679944adSJunchao Zhang PetscScalar a; 3474679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3475679944adSJunchao Zhang 3476679944adSJunchao Zhang PetscFunctionBegin; 3477679944adSJunchao Zhang nskip = high - low; 34789566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3479679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3480679944adSJunchao Zhang for (i = 0; i < m; i++) { 3481679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34829566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3483679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3484679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34859566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3486679944adSJunchao Zhang } 3487e2ce353bSJunchao Zhang } 34889566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34899566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3491679944adSJunchao Zhang } 3492679944adSJunchao Zhang 34930a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3494cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3495cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3496cb5b572fSBarry Smith MatMult_SeqAIJ, 349797304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34987c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34997c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3500f4259b30SLisandro Dalcin NULL, 3501f4259b30SLisandro Dalcin NULL, 
3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin /* 10*/ NULL, 3504cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3505f4259b30SLisandro Dalcin NULL, 350641f059aeSBarry Smith MatSOR_SeqAIJ, 350791e9d3e2SHong Zhang MatTranspose_SeqAIJ, 350897304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3509cb5b572fSBarry Smith MatEqual_SeqAIJ, 3510cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3511cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3512cb5b572fSBarry Smith MatNorm_SeqAIJ, 3513f4259b30SLisandro Dalcin /* 20*/ NULL, 3514cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3515cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3516cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3517d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520f4259b30SLisandro Dalcin NULL, 3521f4259b30SLisandro Dalcin NULL, 352226cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3523f4259b30SLisandro Dalcin NULL, 3524f4259b30SLisandro Dalcin NULL, 3525f4259b30SLisandro Dalcin NULL, 3526f4259b30SLisandro Dalcin NULL, 3527d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3528f4259b30SLisandro Dalcin NULL, 3529f4259b30SLisandro Dalcin NULL, 3530cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3531f4259b30SLisandro Dalcin NULL, 3532d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35337dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3534cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3535cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3536cb5b572fSBarry Smith MatCopy_SeqAIJ, 3537d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3538cb5b572fSBarry Smith MatScale_SeqAIJ, 35397d68702bSBarry Smith MatShift_SeqAIJ, 354079299369SBarry Smith MatDiagonalSet_SeqAIJ, 35416e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 354273a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35433b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35443b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35453b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3546a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 
354793dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550cda55fadSBarry Smith MatPermute_SeqAIJ, 3551f4259b30SLisandro Dalcin NULL, 3552f4259b30SLisandro Dalcin /* 59*/ NULL, 3553b9b97703SBarry Smith MatDestroy_SeqAIJ, 3554b9b97703SBarry Smith MatView_SeqAIJ, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin NULL, 3557f4259b30SLisandro Dalcin /* 64*/ NULL, 3558321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin NULL, 3562d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3563c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 3566f4259b30SLisandro Dalcin NULL, 3567f4259b30SLisandro Dalcin /* 74*/ NULL, 35683acb8795SBarry Smith MatFDColoringApply_AIJ, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin NULL, 3571f4259b30SLisandro Dalcin NULL, 35726ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3573f4259b30SLisandro Dalcin NULL, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 3576bc011b1eSHong Zhang MatLoad_SeqAIJ, 35776cff0a6bSPierre Jolivet /* 84*/ NULL, 35786cff0a6bSPierre Jolivet NULL, 3579f4259b30SLisandro Dalcin NULL, 3580f4259b30SLisandro Dalcin NULL, 3581f4259b30SLisandro Dalcin NULL, 3582f4259b30SLisandro Dalcin /* 89*/ NULL, 3583f4259b30SLisandro Dalcin NULL, 358426be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3585f4259b30SLisandro Dalcin NULL, 3586f4259b30SLisandro Dalcin NULL, 35878fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 35906fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3591f4259b30SLisandro Dalcin NULL, 35924222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro 
Dalcin NULL, 359587d4246cSBarry Smith MatConjugate_SeqAIJ, 3596f4259b30SLisandro Dalcin NULL, 3597d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 359899cafbc1SBarry Smith MatRealPart_SeqAIJ, 3599f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3600f4259b30SLisandro Dalcin NULL, 3601f4259b30SLisandro Dalcin NULL, 3602cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3603f4259b30SLisandro Dalcin NULL, 36042af78befSBarry Smith MatGetRowMin_SeqAIJ, 3605f4259b30SLisandro Dalcin NULL, 3606599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3607f4259b30SLisandro Dalcin /*114*/ NULL, 3608f4259b30SLisandro Dalcin NULL, 3609f4259b30SLisandro Dalcin NULL, 3610f4259b30SLisandro Dalcin NULL, 3611f4259b30SLisandro Dalcin NULL, 3612f4259b30SLisandro Dalcin /*119*/ NULL, 3613f4259b30SLisandro Dalcin NULL, 3614f4259b30SLisandro Dalcin NULL, 3615f4259b30SLisandro Dalcin NULL, 3616b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36170716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3618a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 361937868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36200da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3621f4259b30SLisandro Dalcin NULL, 3622f4259b30SLisandro Dalcin /*129*/ NULL, 3623f4259b30SLisandro Dalcin NULL, 3624f4259b30SLisandro Dalcin NULL, 362575648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3626b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3627b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36282b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3629f4259b30SLisandro Dalcin NULL, 3630f4259b30SLisandro Dalcin NULL, 36313964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3632f4259b30SLisandro Dalcin /*139*/ NULL, 3633f4259b30SLisandro Dalcin NULL, 3634f4259b30SLisandro Dalcin NULL, 36353a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36369c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36374222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 
36384222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3639f4259b30SLisandro Dalcin NULL, 364072833a62Smarkadams4 NULL, 364172833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36422d776b49SBarry Smith NULL, 3643dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3644eede4a3fSMark Adams MatEliminateZeros_SeqAIJ, 36454cc2b5b5SPierre Jolivet MatGetRowSumAbs_SeqAIJ, 364642ce410bSJunchao Zhang NULL, 364742ce410bSJunchao Zhang NULL, 3648fe1fc275SAlexander /*155*/ NULL, 3649fe1fc275SAlexander MatCopyHashToXAIJ_Seq_Hash}; 365017ab2063SBarry Smith 3651ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3652d71ae5a4SJacob Faibussowitsch { 3653bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 365497f1f81fSBarry Smith PetscInt i, nz, n; 3655bef8e0ddSBarry Smith 3656bef8e0ddSBarry Smith PetscFunctionBegin; 3657bef8e0ddSBarry Smith nz = aij->maxnz; 3658d0f46423SBarry Smith n = mat->rmap->n; 3659ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3660bef8e0ddSBarry Smith aij->nz = nz; 3661ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3663bef8e0ddSBarry Smith } 3664bef8e0ddSBarry Smith 3665a3bb6f32SFande Kong /* 3666ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3667ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3668ddea5d60SJunchao Zhang */ 3669d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3670d71ae5a4SJacob Faibussowitsch { 3671a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3672eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3673eec179cfSJacob Faibussowitsch PetscHashIter tpos; 367425b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 367525b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3676a3bb6f32SFande Kong 3677a3bb6f32SFande Kong PetscFunctionBegin; 3678a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36794f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3680a3bb6f32SFande Kong /* use a table */ 3681eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3682a3bb6f32SFande Kong ec = 0; 368325b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368425b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3685eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3686a3bb6f32SFande Kong if (!data) { 3687a3bb6f32SFande Kong /* one based table */ 3688c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3689a3bb6f32SFande Kong } 3690a3bb6f32SFande Kong } 3691a3bb6f32SFande Kong /* form array of columns we need */ 36929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3693eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3694eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3695eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3696eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3697eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3698a3bb6f32SFande Kong gid--; 3699a3bb6f32SFande 
Kong lid--; 3700a3bb6f32SFande Kong garray[lid] = gid; 3701a3bb6f32SFande Kong } 37029566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3703eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3704c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3705a3bb6f32SFande Kong /* compact out the extra columns in B */ 370625b670f0SStefano Zampini for (i = 0; i < nz; i++) { 370725b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3708eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3709a3bb6f32SFande Kong lid--; 371025b670f0SStefano Zampini jj[i] = lid; 3711a3bb6f32SFande Kong } 37129566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3713eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 37149566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 37159566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 37169566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 37173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3718a3bb6f32SFande Kong } 3719a3bb6f32SFande Kong 3720bef8e0ddSBarry Smith /*@ 3721bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3722bef8e0ddSBarry Smith in the matrix. 
3723bef8e0ddSBarry Smith 3724bef8e0ddSBarry Smith Input Parameters: 372511a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3726bef8e0ddSBarry Smith - indices - the column indices 3727bef8e0ddSBarry Smith 372815091d37SBarry Smith Level: advanced 372915091d37SBarry Smith 3730bef8e0ddSBarry Smith Notes: 3731bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3732bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 373311a5261eSBarry Smith of the `MatSetValues()` operation. 3734bef8e0ddSBarry Smith 3735bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 373611a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3737bef8e0ddSBarry Smith 373811a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3739bef8e0ddSBarry Smith 3740b9617806SBarry Smith The indices should start with zero, not one. 3741b9617806SBarry Smith 37421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3743bef8e0ddSBarry Smith @*/ 3744d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3745d71ae5a4SJacob Faibussowitsch { 3746bef8e0ddSBarry Smith PetscFunctionBegin; 37470700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37484f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3749cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3751bef8e0ddSBarry Smith } 3752bef8e0ddSBarry Smith 3753ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3754d71ae5a4SJacob Faibussowitsch { 3755be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3756d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3757be6bf707SBarry Smith 3758be6bf707SBarry Smith PetscFunctionBegin; 375928b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3760be6bf707SBarry Smith 3761be6bf707SBarry Smith /* allocate space for values if not already there */ 37624dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3763be6bf707SBarry Smith 3764be6bf707SBarry Smith /* copy values over */ 37659566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3767be6bf707SBarry Smith } 3768be6bf707SBarry Smith 3769be6bf707SBarry Smith /*@ 377020f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3771be6bf707SBarry Smith nonlinear portion. 3772be6bf707SBarry Smith 3773c3339decSBarry Smith Logically Collect 3774be6bf707SBarry Smith 377527430b45SBarry Smith Input Parameter: 377611a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3777be6bf707SBarry Smith 377815091d37SBarry Smith Level: advanced 377915091d37SBarry Smith 37802920cce0SJacob Faibussowitsch Example Usage: 378127430b45SBarry Smith .vb 37822ef1f0ffSBarry Smith Using SNES 378327430b45SBarry Smith Create Jacobian matrix 378427430b45SBarry Smith Set linear terms into matrix 378527430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 378627430b45SBarry Smith final nonzero structure (i.e. 
    setting the nonlinear terms and applying
    boundary conditions again will not change the nonzero structure)
    MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
    MatStoreValues(mat);
    Call SNESSetJacobian() with matrix
    In your Jacobian routine
    MatRetrieveValues(mat);
    Set nonlinear terms in matrix

    Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
    // build linear portion of Jacobian
    MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
    MatStoreValues(mat);
    loop over nonlinear iterations
    MatRetrieveValues(mat);
    // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
    // call MatAssemblyBegin/End() on matrix
    Solve linear system with Jacobian
    endloop
.ve

  Notes:
  Matrix must already be assembled before calling this routine.
  Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
  calling this routine.

  When this is called multiple times it overwrites the previous set of stored values
  and does not allocate additional space.
38140c468ba9SBarry Smith 3815fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3816be6bf707SBarry Smith @*/ 3817d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3818d71ae5a4SJacob Faibussowitsch { 3819be6bf707SBarry Smith PetscFunctionBegin; 38200700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 382128b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 382228b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3823cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3825be6bf707SBarry Smith } 3826be6bf707SBarry Smith 3827ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3828d71ae5a4SJacob Faibussowitsch { 3829be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3830d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3831be6bf707SBarry Smith 3832be6bf707SBarry Smith PetscFunctionBegin; 383328b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 383428b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3835be6bf707SBarry Smith /* copy values over */ 38369566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3838be6bf707SBarry Smith } 3839be6bf707SBarry Smith 3840be6bf707SBarry Smith /*@ 384120f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3842be6bf707SBarry Smith 3843c3339decSBarry Smith Logically Collect 3844be6bf707SBarry Smith 38452fe279fdSBarry Smith 
Input Parameter: 384611a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3847be6bf707SBarry Smith 384815091d37SBarry Smith Level: advanced 384915091d37SBarry Smith 38501cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3851be6bf707SBarry Smith @*/ 3852d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3853d71ae5a4SJacob Faibussowitsch { 3854be6bf707SBarry Smith PetscFunctionBegin; 38550700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 385628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 385728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3858cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3860be6bf707SBarry Smith } 3861be6bf707SBarry Smith 38625d83a8b1SBarry Smith /*@ 386311a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38640d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 386520f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 386620f4b53cSBarry Smith (or the array `nnz`). 386717ab2063SBarry Smith 3868d083f849SBarry Smith Collective 3869db81eaa0SLois Curfman McInnes 387017ab2063SBarry Smith Input Parameters: 387111a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 387217ab2063SBarry Smith . m - number of rows 387317ab2063SBarry Smith . n - number of columns 387417ab2063SBarry Smith . 
nz   - number of nonzeros per row (same for all rows)
- nnz  - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Output Parameter:
. A - the matrix

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  It is recommended to use `MatCreateFromOptions()` instead of this routine

  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  By default, this format uses inodes (identical nodes) when possible, to
  improve numerical efficiency of matrix-vector products and solves. We
  search for consecutive rows with the same nonzero structure, thereby
  reusing matrix information to achieve increased efficiency.
39056c7ebb05SLois Curfman McInnes 39061cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 390717ab2063SBarry Smith @*/ 3908d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3909d71ae5a4SJacob Faibussowitsch { 39103a40ed3dSBarry Smith PetscFunctionBegin; 39119566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 39129566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 39139566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 39149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 39153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3916273d9f13SBarry Smith } 3917273d9f13SBarry Smith 39185d83a8b1SBarry Smith /*@ 3919273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3920273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3921273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3922273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3923273d9f13SBarry Smith 3924d083f849SBarry Smith Collective 3925273d9f13SBarry Smith 3926273d9f13SBarry Smith Input Parameters: 39271c4f3114SJed Brown + B - The matrix 3928273d9f13SBarry Smith . 
nz  - number of nonzeros per row (same for all rows)
- nnz - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.  See the users' manual for details.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  You can call `MatGetInfo()` to get information on how effective the preallocation was;
  for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
  You can also run with the option -info and look for messages with the string
  malloc in them to see if additional memory allocation was needed.
3954aa95bbe8SBarry Smith 395511a5261eSBarry Smith Developer Notes: 395611a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3957a96a251dSBarry Smith entries or columns indices 3958a96a251dSBarry Smith 3959273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3960273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3961273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3962273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3963273d9f13SBarry Smith 39641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3965db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3966273d9f13SBarry Smith @*/ 3967d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3968d71ae5a4SJacob Faibussowitsch { 3969a23d5eceSKris Buschelman PetscFunctionBegin; 39706ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39716ba663aaSJed Brown PetscValidType(B, 1); 3972cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3974a23d5eceSKris Buschelman } 3975a23d5eceSKris Buschelman 3976d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3977d71ae5a4SJacob Faibussowitsch { 3978ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39792576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 398097f1f81fSBarry Smith PetscInt i; 3981273d9f13SBarry Smith 3982273d9f13SBarry Smith PetscFunctionBegin; 3983ad79cf63SBarry Smith if (B->hash_active) { 3984aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3985ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3986ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3987ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3988ad79cf63SBarry Smith } 39892576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3990a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3991c461c341SBarry Smith skipallocation = PETSC_TRUE; 3992c461c341SBarry Smith nz = 0; 3993c461c341SBarry Smith } 39949566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39959566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3996899cda47SBarry Smith 3997435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 399808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 39999f0612e4SBarry Smith if (nnz) { 4000d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 400108401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 400208401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 4003b73539f3SBarry Smith } 4004b73539f3SBarry Smith } 4005b73539f3SBarry Smith 4006273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 4007ab93d7beSBarry Smith if (!skipallocation) { 40084dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 4009071fcb05SBarry Smith if (!b->ilen) { 4010071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 40119566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 4012071fcb05SBarry Smith } else { 40139566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 40142ee49352SLisandro Dalcin } 4015aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 4016273d9f13SBarry Smith if (!nnz) { 4017435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4018c62bd62aSJed Brown else if (nz < 0) nz = 1; 40195d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4020d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4021c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4022273d9f13SBarry Smith } else { 4023c73702f5SBarry Smith PetscInt64 nz64 = 0; 40249371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40259371c9d4SSatish Balay b->imax[i] = nnz[i]; 40269371c9d4SSatish Balay nz64 += nnz[i]; 40279371c9d4SSatish Balay } 40289566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4029273d9f13SBarry Smith } 4030ab93d7beSBarry Smith 4031273d9f13SBarry Smith /* allocate the matrix space */ 40329566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 40339f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j)); 40349f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i)); 40359f0612e4SBarry Smith b->free_ij = PETSC_TRUE; 4036396832f4SHong Zhang if (B->structure_only) { 40379f0612e4SBarry Smith b->free_a = PETSC_FALSE; 4038396832f4SHong Zhang } else { 40399f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a)); 40409f0612e4SBarry Smith b->free_a = PETSC_TRUE; 4041396832f4SHong Zhang } 4042bfeeae90SHong Zhang b->i[0] = 0; 4043ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4044c461c341SBarry Smith } else { 
4045e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4046e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4047c461c341SBarry Smith } 4048273d9f13SBarry Smith 4049846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4050846b4da1SFande Kong /* reserve user-requested sparsity */ 40519566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4052846b4da1SFande Kong } 4053846b4da1SFande Kong 4054273d9f13SBarry Smith b->nz = 0; 4055273d9f13SBarry Smith b->maxnz = nz; 4056273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40571baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4058cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4059cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40605519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40615519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40625519a089SJose E. Roman */ 40635519a089SJose E. Roman B->nonzerostate++; 40643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4065273d9f13SBarry Smith } 4066273d9f13SBarry Smith 4067ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4068d71ae5a4SJacob Faibussowitsch { 4069846b4da1SFande Kong Mat_SeqAIJ *a; 4070a5bbaf83SFande Kong PetscInt i; 40711f14be2bSBarry Smith PetscBool skipreset; 4072846b4da1SFande Kong 4073846b4da1SFande Kong PetscFunctionBegin; 4074846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 407514d0e64fSAlex Lindsay 407614d0e64fSAlex Lindsay /* Check local size. 
If zero, then return */ 40773ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 407814d0e64fSAlex Lindsay 4079846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40802c814fdeSFande Kong /* if no saved info, we error out */ 408128b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40822c814fdeSFande Kong 40831f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40842c814fdeSFande Kong 40851f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40861f14be2bSBarry Smith if (!skipreset) { 40879566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40889566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4089846b4da1SFande Kong a->i[0] = 0; 4090ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4091846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4092846b4da1SFande Kong a->nz = 0; 4093846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4094846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4095846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4096846b4da1SFande Kong A->assembled = PETSC_FALSE; 40971f14be2bSBarry Smith } 40983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4099846b4da1SFande Kong } 4100846b4da1SFande Kong 410158d36128SBarry Smith /*@ 410211a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4103a1661176SMatthew Knepley 4104a1661176SMatthew Knepley Input Parameters: 4105a1661176SMatthew Knepley + B - the matrix 4106d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4107d8a51d2aSBarry Smith . 
j - the column indices for each row (indices start with zero); these must be sorted for each row
- v - optional values in the matrix, use `NULL` if not provided

  Level: developer

  Notes:
  The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`

  This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
  structure will be the union of all the previous nonzero structures.

  Developer Notes:
  An optimization could be added to the implementation where it checks if the `i` and `j` are identical to the current `i` and `j` and
  then just copies the `v` values directly with `PetscMemcpy()`.

  This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
41236a9b8d82SBarry Smith 4124fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4125a1661176SMatthew Knepley @*/ 4126d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4127d71ae5a4SJacob Faibussowitsch { 4128a1661176SMatthew Knepley PetscFunctionBegin; 41290700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41306ba663aaSJed Brown PetscValidType(B, 1); 4131cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4133a1661176SMatthew Knepley } 4134a1661176SMatthew Knepley 4135ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4136d71ae5a4SJacob Faibussowitsch { 4137a1661176SMatthew Knepley PetscInt i; 4138a1661176SMatthew Knepley PetscInt m, n; 4139a1661176SMatthew Knepley PetscInt nz; 41406a9b8d82SBarry Smith PetscInt *nnz; 4141a1661176SMatthew Knepley 4142a1661176SMatthew Knepley PetscFunctionBegin; 4143aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4144779a8d59SSatish Balay 41459566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41469566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4147779a8d59SSatish Balay 41489566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4150a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4151b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 415208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4153a1661176SMatthew Knepley nnz[i] = nz; 4154a1661176SMatthew Knepley } 41559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41569566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4157a1661176SMatthew Knepley 41588e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4159a1661176SMatthew Knepley 41609566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41619566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4162a1661176SMatthew Knepley 41639566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4165a1661176SMatthew Knepley } 4166a1661176SMatthew Knepley 4167ad7e164aSPierre Jolivet /*@ 41682ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4169ad7e164aSPierre Jolivet 4170ad7e164aSPierre Jolivet Input Parameters: 4171ad7e164aSPierre Jolivet + A - left-hand side matrix 4172ad7e164aSPierre Jolivet . B - right-hand side matrix 417311a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4174ad7e164aSPierre Jolivet 4175ad7e164aSPierre Jolivet Output Parameter: 41762ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4177ad7e164aSPierre Jolivet 4178ad7e164aSPierre Jolivet Level: intermediate 4179ad7e164aSPierre Jolivet 418011a5261eSBarry Smith Note: 418111a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4182ad7e164aSPierre Jolivet 41831cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4184ad7e164aSPierre Jolivet @*/ 4185d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4186d71ae5a4SJacob Faibussowitsch { 4187ad7e164aSPierre Jolivet PetscFunctionBegin; 4188ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4189ad7e164aSPierre Jolivet PetscValidType(A, 1); 4190ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4191ad7e164aSPierre Jolivet PetscValidType(B, 2); 41924f572ea9SToby Isaac PetscAssertPointer(C, 4); 4193ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4194ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4195ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4196ad7e164aSPierre Jolivet } 4197cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4199ad7e164aSPierre Jolivet } 4200ad7e164aSPierre Jolivet 4201ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4202d71ae5a4SJacob Faibussowitsch { 4203ad7e164aSPierre Jolivet Mat newmat; 4204ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4205ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4206ad7e164aSPierre Jolivet PetscScalar *v; 4207fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4208ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4209ad7e164aSPierre Jolivet PetscBool flg; 4210ad7e164aSPierre Jolivet 4211ad7e164aSPierre Jolivet PetscFunctionBegin; 421228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421328b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 421428b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421528b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42169566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 421728b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4218aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4219ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42209566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42219566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42229566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42239566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4224ad7e164aSPierre Jolivet i[0] = 0; 4225ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4226ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4227ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4228ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4229ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4230ad7e164aSPierre Jolivet } 4231ad7e164aSPierre Jolivet } 4232ad7e164aSPierre Jolivet } 42339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4234ad7e164aSPierre Jolivet *C = newmat; 42359566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4236ad7e164aSPierre Jolivet nnz = 0; 4237ad7e164aSPierre Jolivet } 42389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4241ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4242ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4243ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4244ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4245ad7e164aSPierre Jolivet } 4246ad7e164aSPierre Jolivet } 4247ad7e164aSPierre Jolivet } 42489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4252ad7e164aSPierre Jolivet } 4253ad7e164aSPierre Jolivet 4254c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4255af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4256170fe5c8SBarry Smith 4257170fe5c8SBarry Smith /* 4258170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4259170fe5c8SBarry Smith 4260170fe5c8SBarry Smith n p p 42612da392ccSBarry Smith [ ] [ ] [ ] 42622da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42632da392ccSBarry Smith [ ] [ ] [ ] 4264170fe5c8SBarry Smith 4265170fe5c8SBarry Smith */ 4266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4267d71ae5a4SJacob Faibussowitsch { 4268170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4269170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4270170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 427186214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4272170fe5c8SBarry Smith const PetscInt *ii, *idx; 4273170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4274170fe5c8SBarry Smith PetscScalar *c, *c_q; 427586214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 427686214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4277170fe5c8SBarry Smith 4278170fe5c8SBarry Smith PetscFunctionBegin; 4279d0f46423SBarry Smith m = A->rmap->n; 4280d0f46423SBarry Smith n = A->cmap->n; 4281d0f46423SBarry Smith p = B->cmap->n; 4282170fe5c8SBarry Smith a = sub_a->v; 4283170fe5c8SBarry Smith b = sub_b->a; 4284170fe5c8SBarry Smith c = sub_c->v; 428586214ceeSStefano Zampini if (clda == m) { 42869566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 428786214ceeSStefano Zampini } else { 428886214ceeSStefano Zampini for (j = 0; j < p; j++) 42899371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 429086214ceeSStefano Zampini } 4291170fe5c8SBarry Smith ii = sub_b->i; 4292170fe5c8SBarry Smith idx = sub_b->j; 4293170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4294170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4295170fe5c8SBarry Smith while (q-- > 0) { 429686214ceeSStefano Zampini c_q = c + clda * (*idx); 429786214ceeSStefano Zampini a_q = a + alda * i; 4298854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4299170fe5c8SBarry Smith idx++; 4300170fe5c8SBarry Smith b++; 4301170fe5c8SBarry Smith } 4302170fe5c8SBarry Smith } 43033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4304170fe5c8SBarry Smith } 4305170fe5c8SBarry Smith 4306d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4307d71ae5a4SJacob Faibussowitsch { 4308d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 430986214ceeSStefano Zampini PetscBool cisdense; 4310170fe5c8SBarry Smith 4311170fe5c8SBarry Smith PetscFunctionBegin; 431208401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43139566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43149566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4315d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 431648a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43179566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4318d73949e8SHong Zhang 43194222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4321170fe5c8SBarry Smith } 4322170fe5c8SBarry Smith 43230bad9183SKris Buschelman /*MC 4324fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43250bad9183SKris Buschelman based on compressed sparse row format. 43260bad9183SKris Buschelman 43272ef1f0ffSBarry Smith Options Database Key: 43280bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43290bad9183SKris Buschelman 43300bad9183SKris Buschelman Level: beginner 43310bad9183SKris Buschelman 43320cd7f59aSBarry Smith Notes: 43332ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43340cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43350cd7f59aSBarry Smith in the matrix 43360cd7f59aSBarry Smith 433711a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
  `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

  Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`; this type also automatically switches over to use inodes when
   enough exist.
4363ccd284c7SBarry Smith 43641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4365ccd284c7SBarry Smith M*/ 4366ccd284c7SBarry Smith 4367ccd284c7SBarry Smith /*MC 4368ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4369ccd284c7SBarry Smith 43702ef1f0ffSBarry Smith Options Database Key: 43712ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43722ef1f0ffSBarry Smith 43732ef1f0ffSBarry Smith Level: beginner 43742ef1f0ffSBarry Smith 43752ef1f0ffSBarry Smith Note: 437611a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 437711a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 437811a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4379ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4380ccd284c7SBarry Smith the above preallocation routines for simplicity. 4381ccd284c7SBarry Smith 43821cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4383ccd284c7SBarry Smith M*/ 4384ccd284c7SBarry Smith 43857906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43867906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43877906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43887906f579SHong Zhang #endif 4389d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4390d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4391d24d4204SJose E. 
Roman #endif 43927906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43937906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43947906f579SHong Zhang #endif 43957906f579SHong Zhang 4396d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4397c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43984222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43997906f579SHong Zhang 44008c778c55SBarry Smith /*@C 440111a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 44028c778c55SBarry Smith 44038c778c55SBarry Smith Not Collective 44048c778c55SBarry Smith 44058c778c55SBarry Smith Input Parameter: 4406fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44078c778c55SBarry Smith 44088c778c55SBarry Smith Output Parameter: 44098c778c55SBarry Smith . 
array - pointer to the data 44108c778c55SBarry Smith 44118c778c55SBarry Smith Level: intermediate 44128c778c55SBarry Smith 4413fe59aa6dSJacob Faibussowitsch Fortran Notes: 44140ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44150ab4885dSBarry Smith 44161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44178c778c55SBarry Smith @*/ 44185d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4419d71ae5a4SJacob Faibussowitsch { 4420d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44218c778c55SBarry Smith 44228c778c55SBarry Smith PetscFunctionBegin; 4423d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44249566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4425d67d9f35SJunchao Zhang } else { 4426d67d9f35SJunchao Zhang *array = aij->a; 4427d67d9f35SJunchao Zhang } 44283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4429d67d9f35SJunchao Zhang } 4430d67d9f35SJunchao Zhang 4431d67d9f35SJunchao Zhang /*@C 443211a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4433d67d9f35SJunchao Zhang 4434d67d9f35SJunchao Zhang Not Collective 4435d67d9f35SJunchao Zhang 4436d67d9f35SJunchao Zhang Input Parameters: 4437fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4438d67d9f35SJunchao Zhang - array - pointer to the data 4439d67d9f35SJunchao Zhang 4440d67d9f35SJunchao Zhang Level: intermediate 4441d67d9f35SJunchao Zhang 4442fe59aa6dSJacob Faibussowitsch Fortran Notes: 44430ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44440ab4885dSBarry Smith 44451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4446d67d9f35SJunchao Zhang @*/ 
44475d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4448d71ae5a4SJacob Faibussowitsch { 4449d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4450d67d9f35SJunchao Zhang 4451d67d9f35SJunchao Zhang PetscFunctionBegin; 4452d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44539566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4454d67d9f35SJunchao Zhang } else { 4455d67d9f35SJunchao Zhang *array = NULL; 4456d67d9f35SJunchao Zhang } 44579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44589566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44608c778c55SBarry Smith } 44618c778c55SBarry Smith 446221e72a00SBarry Smith /*@C 446311a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44648f1ea47aSStefano Zampini 44650ab4885dSBarry Smith Not Collective; No Fortran Support 44668f1ea47aSStefano Zampini 44678f1ea47aSStefano Zampini Input Parameter: 4468fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44698f1ea47aSStefano Zampini 44708f1ea47aSStefano Zampini Output Parameter: 44718f1ea47aSStefano Zampini . 
array - pointer to the data 44728f1ea47aSStefano Zampini 44738f1ea47aSStefano Zampini Level: intermediate 44748f1ea47aSStefano Zampini 44751cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44768f1ea47aSStefano Zampini @*/ 44775d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4478d71ae5a4SJacob Faibussowitsch { 4479d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44808f1ea47aSStefano Zampini 44818f1ea47aSStefano Zampini PetscFunctionBegin; 4482d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44839566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4484d67d9f35SJunchao Zhang } else { 4485d67d9f35SJunchao Zhang *array = aij->a; 4486d67d9f35SJunchao Zhang } 44873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44888f1ea47aSStefano Zampini } 44898f1ea47aSStefano Zampini 44908f1ea47aSStefano Zampini /*@C 449111a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44928f1ea47aSStefano Zampini 44930ab4885dSBarry Smith Not Collective; No Fortran Support 44948f1ea47aSStefano Zampini 44958f1ea47aSStefano Zampini Input Parameter: 4496fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44978f1ea47aSStefano Zampini 44988f1ea47aSStefano Zampini Output Parameter: 44998f1ea47aSStefano Zampini . 
array - pointer to the data 45008f1ea47aSStefano Zampini 45018f1ea47aSStefano Zampini Level: intermediate 45028f1ea47aSStefano Zampini 45031cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45048f1ea47aSStefano Zampini @*/ 45055d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4506d71ae5a4SJacob Faibussowitsch { 4507d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 45088f1ea47aSStefano Zampini 45098f1ea47aSStefano Zampini PetscFunctionBegin; 4510d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45119566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4512d67d9f35SJunchao Zhang } else { 4513d67d9f35SJunchao Zhang *array = NULL; 4514d67d9f35SJunchao Zhang } 45153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4516d67d9f35SJunchao Zhang } 4517d67d9f35SJunchao Zhang 4518d67d9f35SJunchao Zhang /*@C 451911a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4520d67d9f35SJunchao Zhang 45210ab4885dSBarry Smith Not Collective; No Fortran Support 4522d67d9f35SJunchao Zhang 4523d67d9f35SJunchao Zhang Input Parameter: 4524fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4525d67d9f35SJunchao Zhang 4526d67d9f35SJunchao Zhang Output Parameter: 4527d67d9f35SJunchao Zhang . 
array - pointer to the data 4528d67d9f35SJunchao Zhang 4529d67d9f35SJunchao Zhang Level: intermediate 4530d67d9f35SJunchao Zhang 45311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4532d67d9f35SJunchao Zhang @*/ 45335d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4534d71ae5a4SJacob Faibussowitsch { 4535d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4536d67d9f35SJunchao Zhang 4537d67d9f35SJunchao Zhang PetscFunctionBegin; 4538d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45399566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4540d67d9f35SJunchao Zhang } else { 4541d67d9f35SJunchao Zhang *array = aij->a; 4542d67d9f35SJunchao Zhang } 45439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45449566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4546d67d9f35SJunchao Zhang } 4547d67d9f35SJunchao Zhang 4548d67d9f35SJunchao Zhang /*@C 4549d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4550d67d9f35SJunchao Zhang 45510ab4885dSBarry Smith Not Collective; No Fortran Support 4552d67d9f35SJunchao Zhang 4553d67d9f35SJunchao Zhang Input Parameter: 4554fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4555d67d9f35SJunchao Zhang 4556d67d9f35SJunchao Zhang Output Parameter: 4557d67d9f35SJunchao Zhang . 
array - pointer to the data 4558d67d9f35SJunchao Zhang 4559d67d9f35SJunchao Zhang Level: intermediate 4560d67d9f35SJunchao Zhang 45611cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4562d67d9f35SJunchao Zhang @*/ 45635d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4564d71ae5a4SJacob Faibussowitsch { 4565d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4566d67d9f35SJunchao Zhang 4567d67d9f35SJunchao Zhang PetscFunctionBegin; 4568d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45699566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4570d67d9f35SJunchao Zhang } else { 4571d67d9f35SJunchao Zhang *array = NULL; 4572d67d9f35SJunchao Zhang } 45733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45748f1ea47aSStefano Zampini } 45758f1ea47aSStefano Zampini 45768f1ea47aSStefano Zampini /*@C 457711a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45787ee59b9bSJunchao Zhang 45790ab4885dSBarry Smith Not Collective; No Fortran Support 45807ee59b9bSJunchao Zhang 45817ee59b9bSJunchao Zhang Input Parameter: 458211a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45837ee59b9bSJunchao Zhang 45847ee59b9bSJunchao Zhang Output Parameters: 45857ee59b9bSJunchao Zhang + i - row map array of the matrix 45867ee59b9bSJunchao Zhang . j - column index array of the matrix 45877ee59b9bSJunchao Zhang . a - data array of the matrix 4588fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45897ee59b9bSJunchao Zhang 4590fe59aa6dSJacob Faibussowitsch Level: developer 45912ef1f0ffSBarry Smith 45927ee59b9bSJunchao Zhang Notes: 45932ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45947ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45957ee59b9bSJunchao Zhang 45967ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45972ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45987ee59b9bSJunchao Zhang 45991cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 46007ee59b9bSJunchao Zhang @*/ 46015d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4602d71ae5a4SJacob Faibussowitsch { 46037ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 46047ee59b9bSJunchao Zhang 46057ee59b9bSJunchao Zhang PetscFunctionBegin; 46067ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 46077ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46087ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 46097ee59b9bSJunchao Zhang } else { 46107ee59b9bSJunchao Zhang if (i) *i = aij->i; 46117ee59b9bSJunchao Zhang if (j) *j = aij->j; 46127ee59b9bSJunchao Zhang if (a) *a = aij->a; 46137ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46147ee59b9bSJunchao Zhang } 46153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46167ee59b9bSJunchao Zhang } 46177ee59b9bSJunchao Zhang 4618cc4c1da9SBarry Smith /*@ 461921e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 462021e72a00SBarry Smith 462121e72a00SBarry Smith Not Collective 462221e72a00SBarry Smith 462321e72a00SBarry Smith Input Parameter: 4624fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 462521e72a00SBarry Smith 462621e72a00SBarry Smith Output Parameter: 462721e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 462821e72a00SBarry Smith 462921e72a00SBarry Smith Level: intermediate 463021e72a00SBarry Smith 46311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 463221e72a00SBarry Smith @*/ 4633d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4634d71ae5a4SJacob Faibussowitsch { 463521e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 463621e72a00SBarry Smith 463721e72a00SBarry Smith PetscFunctionBegin; 463821e72a00SBarry Smith *nz = aij->rmax; 46393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 464021e72a00SBarry Smith } 464121e72a00SBarry Smith 464249abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data) 46432c4ab24aSJunchao Zhang { 464449abdd8aSBarry Smith MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data; 46454d86920dSPierre Jolivet 46462c4ab24aSJunchao Zhang PetscFunctionBegin; 46472c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46482c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46492c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46502c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46512c4ab24aSJunchao Zhang } 46522c4ab24aSJunchao Zhang 4653d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4654d71ae5a4SJacob Faibussowitsch { 4655394ed5ebSJunchao Zhang MPI_Comm comm; 4656394ed5ebSJunchao Zhang PetscInt *i, *j; 46570d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4658394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4659394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4660394ed5ebSJunchao Zhang PetscInt *Aj; 4661394ed5ebSJunchao Zhang PetscScalar *Aa; 4662f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 
4663cbc6b225SStefano Zampini MatType rtype; 4664394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46652c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46660d88f7f4SJunchao Zhang PetscBool isorted; 46679f0612e4SBarry Smith PetscBool hypre; 46689f0612e4SBarry Smith const char *name; 4669394ed5ebSJunchao Zhang 4670394ed5ebSJunchao Zhang PetscFunctionBegin; 46719566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46729566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4673e8729f6fSJunchao Zhang i = coo_i; 4674e8729f6fSJunchao Zhang j = coo_j; 46759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46760d88f7f4SJunchao Zhang 46770d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46780d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46790d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46800d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4681394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46820d88f7f4SJunchao Zhang if (isorted) { 46830d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46840d88f7f4SJunchao Zhang else iprev = i[k]; 46850d88f7f4SJunchao Zhang } 4686394ed5ebSJunchao Zhang perm[k] = k; 4687394ed5ebSJunchao Zhang } 4688394ed5ebSJunchao Zhang 46890d88f7f4SJunchao Zhang /* Sort by row if not already */ 46900d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4691651b1cf9SStefano Zampini 4692651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4693651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46949371c9d4SSatish Balay if (i[k] >= 0) break; 4695394ed5ebSJunchao Zhang nneg = k; 46969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4697394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 469835cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4699394ed5ebSJunchao Zhang 47009f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */ 47019f0612e4SBarry Smith PetscCall(PetscArrayzero(Ai, M + 1)); 47029f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4703394ed5ebSJunchao Zhang 4704651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4705651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4706651b1cf9SStefano Zampini 4707394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 470835cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4709394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4710394ed5ebSJunchao Zhang while (k < coo_n) { 47110d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 
47120d88f7f4SJunchao Zhang PetscInt jprev; 47130d88f7f4SJunchao Zhang 47140d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4715394ed5ebSJunchao Zhang row = i[k]; 47160d88f7f4SJunchao Zhang start = k; 47170d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 47180d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 47190d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47200d88f7f4SJunchao Zhang if (strictly_sorted) { 47210d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47220d88f7f4SJunchao Zhang else jprev = j[k]; 47230d88f7f4SJunchao Zhang } 47240d88f7f4SJunchao Zhang k++; 47250d88f7f4SJunchao Zhang } 4726394ed5ebSJunchao Zhang end = k; 47270d88f7f4SJunchao Zhang 4728651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4729651b1cf9SStefano Zampini if (hypre) { 47301690c2aeSBarry Smith PetscInt minj = PETSC_INT_MAX; 4731651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47320d88f7f4SJunchao Zhang 47330d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47340d88f7f4SJunchao Zhang PetscCount tmp; 47350d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47360d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 4737*1c265611SJunchao Zhang j[p] = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[]) 47380d88f7f4SJunchao Zhang j[start] = row; 47390d88f7f4SJunchao Zhang tmp = perm[start]; 4740*1c265611SJunchao Zhang perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below 47410d88f7f4SJunchao Zhang perm[p] = tmp; 47420d88f7f4SJunchao Zhang break; 47430d88f7f4SJunchao Zhang } 47440d88f7f4SJunchao Zhang } 47450d88f7f4SJunchao Zhang } else { 4746651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4747651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4748651b1cf9SStefano 
Zampini minj = PetscMin(minj, j[p]); 4749651b1cf9SStefano Zampini } 47500d88f7f4SJunchao Zhang 4751651b1cf9SStefano Zampini if (hasdiag) { 4752651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4753651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4754651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4755651b1cf9SStefano Zampini } 4756651b1cf9SStefano Zampini } 4757651b1cf9SStefano Zampini } 47580d88f7f4SJunchao Zhang } 4759*1c265611SJunchao Zhang // sort by columns in a row. perm[] indicates their original order 47600d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4761651b1cf9SStefano Zampini 47620d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47630d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47640d88f7f4SJunchao Zhang Aj[q] = j[p]; 47650d88f7f4SJunchao Zhang jmap[q] = 1; 47660d88f7f4SJunchao Zhang } 47676497c311SBarry Smith PetscCall(PetscIntCast(end - start, Ai + row)); 47680d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47690d88f7f4SJunchao Zhang } else { 4770394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4771394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4772651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4773394ed5ebSJunchao Zhang Ai[row] = 1; 4774394ed5ebSJunchao Zhang nnz++; 4775394ed5ebSJunchao Zhang 4776394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4777394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4778394ed5ebSJunchao Zhang q++; 4779394ed5ebSJunchao Zhang jmap[q] = 1; 4780394ed5ebSJunchao Zhang Aj[q] = j[p]; 4781394ed5ebSJunchao Zhang Ai[row]++; 4782394ed5ebSJunchao Zhang nnz++; 4783394ed5ebSJunchao Zhang } else { 4784394ed5ebSJunchao Zhang jmap[q]++; 4785394ed5ebSJunchao Zhang } 4786394ed5ebSJunchao Zhang } 
4787394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4788394ed5ebSJunchao Zhang } 47890d88f7f4SJunchao Zhang } 47900d88f7f4SJunchao Zhang 4791394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4792394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 47930d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4794394ed5ebSJunchao Zhang jmap[0] = 0; 4795394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47960d88f7f4SJunchao Zhang 47979f0612e4SBarry Smith if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */ 4798394ed5ebSJunchao Zhang PetscCount *jmap_new; 4799394ed5ebSJunchao Zhang PetscInt *Aj_new; 4800394ed5ebSJunchao Zhang 48019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 48029566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 48039566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4804394ed5ebSJunchao Zhang jmap = jmap_new; 4805394ed5ebSJunchao Zhang 48069f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new)); 48079566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 48089f0612e4SBarry Smith PetscCall(PetscShmgetDeallocateArray((void **)&Aj)); 4809394ed5ebSJunchao Zhang Aj = Aj_new; 4810394ed5ebSJunchao Zhang } 4811394ed5ebSJunchao Zhang 4812394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4813394ed5ebSJunchao Zhang PetscCount *perm_new; 4814cbc6b225SStefano Zampini 48159566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 48169566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 48179566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4818394ed5ebSJunchao Zhang perm = perm_new; 4819394ed5ebSJunchao Zhang } 4820394ed5ebSJunchao Zhang 48219566063dSJacob 
Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48229f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa)); 48239f0612e4SBarry Smith PetscCall(PetscArrayzero(Aa, nnz)); 48249566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4825394ed5ebSJunchao Zhang 4826394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48272c4ab24aSJunchao Zhang 48282c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48292c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48306497c311SBarry Smith PetscCall(PetscIntCast(nnz, &coo->nz)); 48312c4ab24aSJunchao Zhang coo->n = coo_n; 48322c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48332c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48342c4ab24aSJunchao Zhang coo->perm = perm; 483503e76207SPierre Jolivet PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ)); 48363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4837394ed5ebSJunchao Zhang } 4838394ed5ebSJunchao Zhang 4839d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4840d71ae5a4SJacob Faibussowitsch { 4841394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4842394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48432c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4844394ed5ebSJunchao Zhang PetscScalar *Aa; 48452c4ab24aSJunchao Zhang PetscContainer container; 48462c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4847394ed5ebSJunchao Zhang 4848394ed5ebSJunchao Zhang PetscFunctionBegin; 48492c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48502c4ab24aSJunchao Zhang 
PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48512c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48522c4ab24aSJunchao Zhang perm = coo->perm; 48532c4ab24aSJunchao Zhang jmap = coo->jmap; 48549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4855394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4856b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4857b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4858b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4859394ed5ebSJunchao Zhang } 48609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4862394ed5ebSJunchao Zhang } 4863394ed5ebSJunchao Zhang 486434b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48655063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 486602fe1965SBarry Smith #endif 4867d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4868d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4869d5e393b6SSuyash Tandon #endif 48703d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48715063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48723d0639e7SStefano Zampini #endif 487302fe1965SBarry Smith 4874d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4875d71ae5a4SJacob Faibussowitsch { 4876273d9f13SBarry Smith Mat_SeqAIJ *b; 487738baddfdSBarry Smith PetscMPIInt size; 4878273d9f13SBarry Smith 4879273d9f13SBarry Smith PetscFunctionBegin; 48809566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 488108401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm 
must be of size 1"); 4882273d9f13SBarry Smith 48834dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48842205254eSKarl Rupp 4885b0a32e0cSBarry Smith B->data = (void *)b; 4886aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4887071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48882205254eSKarl Rupp 4889f4259b30SLisandro Dalcin b->row = NULL; 4890f4259b30SLisandro Dalcin b->col = NULL; 4891f4259b30SLisandro Dalcin b->icol = NULL; 4892b810aeb4SBarry Smith b->reallocs = 0; 489336db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4894f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4895416022c9SBarry Smith b->nonew = 0; 4896f4259b30SLisandro Dalcin b->diag = NULL; 4897f4259b30SLisandro Dalcin b->solve_work = NULL; 4898f4259b30SLisandro Dalcin B->spptr = NULL; 4899f4259b30SLisandro Dalcin b->saved_values = NULL; 4900f4259b30SLisandro Dalcin b->idiag = NULL; 4901f4259b30SLisandro Dalcin b->mdiag = NULL; 4902f4259b30SLisandro Dalcin b->ssor_work = NULL; 490371f1c65dSBarry Smith b->omega = 1.0; 490471f1c65dSBarry Smith b->fshift = 0.0; 490571f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4906bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4907a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 490817ab2063SBarry Smith 49099566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4910d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 49119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 49129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4913b3866ffcSBarry Smith #endif 49149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 49159566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49219779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4923191b95cbSRichard Tran Mills #endif 492434b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49259566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 492802fe1965SBarry Smith #endif 4929d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4930d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4931d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, 
"MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4932d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4933d5e393b6SSuyash Tandon #endif 49343d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49363d0639e7SStefano Zampini #endif 49379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4938af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4940af8000cdSHong Zhang #endif 4941d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4943d24d4204SJose E. 
Roman #endif 494463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 494763c07aadSStefano Zampini #endif 49489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 495214e4dea2SJose E. 
Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 4955674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ)); 49569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49649566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49659566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49669566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 496817ab2063SBarry Smith } 496917ab2063SBarry Smith 4970b24902e0SBarry Smith /* 49713893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4972b24902e0SBarry Smith */ 4973d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4974d71ae5a4SJacob Faibussowitsch { 49752a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4976071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 497717ab2063SBarry Smith 49783a40ed3dSBarry Smith PetscFunctionBegin; 4979aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4980273d9f13SBarry Smith 4981d5f3da31SBarry Smith C->factortype = A->factortype; 4982f4259b30SLisandro Dalcin c->row = NULL; 4983f4259b30SLisandro Dalcin c->col = NULL; 4984f4259b30SLisandro Dalcin c->icol = NULL; 49856ad4291fSHong Zhang c->reallocs = 0; 4986bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 498717ab2063SBarry Smith 498869272f91SPierre Jolivet C->assembled = A->assembled; 498917ab2063SBarry Smith 499069272f91SPierre Jolivet if (A->preallocated) { 49919566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49929566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4993eec197d1SBarry Smith 499431fe6a7dSBarry Smith if (!A->hash_active) { 49959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49969566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, 
a->ilen, m * sizeof(PetscInt))); 499917ab2063SBarry Smith 500017ab2063SBarry Smith /* allocate the matrix space */ 5001f77e22a1SHong Zhang if (mallocmatspace) { 50029f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a)); 50039f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j)); 50049f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i)); 50059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 50069f0612e4SBarry Smith c->free_a = PETSC_TRUE; 50079f0612e4SBarry Smith c->free_ij = PETSC_TRUE; 500817ab2063SBarry Smith if (m > 0) { 50099566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 5010be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 50112e5835c6SStefano Zampini const PetscScalar *aa; 50122e5835c6SStefano Zampini 50139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50149566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5016be6bf707SBarry Smith } else { 50179566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 501817ab2063SBarry Smith } 501908480c60SBarry Smith } 5020f77e22a1SHong Zhang } 502131fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 502231fe6a7dSBarry Smith } else { 502331fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 502431fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 502531fe6a7dSBarry Smith } 502617ab2063SBarry Smith 50276ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5028416022c9SBarry Smith c->roworiented = a->roworiented; 5029416022c9SBarry Smith c->nonew = a->nonew; 5030416022c9SBarry Smith if (a->diag) { 50319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 
50329566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5033071fcb05SBarry Smith } else c->diag = NULL; 50342205254eSKarl Rupp 5035f4259b30SLisandro Dalcin c->solve_work = NULL; 5036f4259b30SLisandro Dalcin c->saved_values = NULL; 5037f4259b30SLisandro Dalcin c->idiag = NULL; 5038f4259b30SLisandro Dalcin c->ssor_work = NULL; 5039a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 50406ad4291fSHong Zhang 5041893ad86cSHong Zhang c->rmax = a->rmax; 5042416022c9SBarry Smith c->nz = a->nz; 50438ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5044754ec7b1SSatish Balay 50456ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50466ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5047cd6b891eSBarry Smith if (a->compressedrow.use) { 50486ad4291fSHong Zhang i = a->compressedrow.nrows; 50499566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50509566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50519566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 505227ea64f8SHong Zhang } else { 505327ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50540298fd71SBarry Smith c->compressedrow.i = NULL; 50550298fd71SBarry Smith c->compressedrow.rindex = NULL; 50566ad4291fSHong Zhang } 5057ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5058e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50594846f1f5SKris Buschelman 50609566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 506169272f91SPierre Jolivet } 50629566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 506417ab2063SBarry Smith } 506517ab2063SBarry Smith 
5066d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5067d71ae5a4SJacob Faibussowitsch { 5068b24902e0SBarry Smith PetscFunctionBegin; 50699566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50709566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 507148a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50729566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50739566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5075b24902e0SBarry Smith } 5076b24902e0SBarry Smith 5077d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5078d71ae5a4SJacob Faibussowitsch { 507952f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 508052f91c60SVaclav Hapla 508152f91c60SVaclav Hapla PetscFunctionBegin; 508252f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 508352f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5084c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50859566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 508852f91c60SVaclav Hapla if (isbinary) { 50899566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 509052f91c60SVaclav Hapla } else if (ishdf5) { 509152f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50929566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 509352f91c60SVaclav 
Hapla #else 509452f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 509552f91c60SVaclav Hapla #endif 509652f91c60SVaclav Hapla } else { 509798921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 509852f91c60SVaclav Hapla } 50993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 510052f91c60SVaclav Hapla } 510152f91c60SVaclav Hapla 5102d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5103d71ae5a4SJacob Faibussowitsch { 51043ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 51053ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5106fbdbba38SShri Abhyankar 5107fbdbba38SShri Abhyankar PetscFunctionBegin; 51089566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5109bbead8a2SBarry Smith 51103ea6fe3dSLisandro Dalcin /* read in matrix header */ 51119566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 511208401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 51139371c9d4SSatish Balay M = header[1]; 51149371c9d4SSatish Balay N = header[2]; 51159371c9d4SSatish Balay nz = header[3]; 511608401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 511708401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 511808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format 
on disk, cannot load as SeqAIJ"); 5119fbdbba38SShri Abhyankar 51203ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 51219566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51223ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51233ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51243ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51253ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51263ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51289566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51293ea6fe3dSLisandro Dalcin 51303ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51319566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5132aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51333ea6fe3dSLisandro Dalcin 5134fbdbba38SShri Abhyankar /* read in row lengths */ 51359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51369566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51373ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51389371c9d4SSatish Balay sum = 0; 51399371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 514008401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51413ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51439566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5144aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51453ea6fe3dSLisandro Dalcin /* store row lengths */ 51469566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51479566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5148fbdbba38SShri Abhyankar 51493ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51509371c9d4SSatish Balay a->i[0] = 0; 51519371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51523ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51539566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51543ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51559566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5156fbdbba38SShri Abhyankar 51579566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51589566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5160fbdbba38SShri Abhyankar } 5161fbdbba38SShri Abhyankar 5162d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5163d71ae5a4SJacob Faibussowitsch { 51647264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5165fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5166eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5167eeffb40dSHong Zhang PetscInt k; 5168eeffb40dSHong Zhang #endif 51697264ac53SSatish Balay 51703a40ed3dSBarry Smith PetscFunctionBegin; 5171bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5172d0f46423SBarry Smith if ((A->rmap->n != 
B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5173ca44d042SBarry Smith *flg = PETSC_FALSE; 51743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5175bcd2baecSBarry Smith } 51767264ac53SSatish Balay 51777264ac53SSatish Balay /* if the a->i are the same */ 51789566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51793ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51807264ac53SSatish Balay 51817264ac53SSatish Balay /* if a->j are the same */ 51829566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51833ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5184bcd2baecSBarry Smith 51859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5187bcd2baecSBarry Smith /* if a->a are the same */ 5188eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5189eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5190fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5191eeffb40dSHong Zhang *flg = PETSC_FALSE; 51923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5193eeffb40dSHong Zhang } 5194eeffb40dSHong Zhang } 5195eeffb40dSHong Zhang #else 51969566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5197eeffb40dSHong Zhang #endif 51989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 52003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52017264ac53SSatish Balay } 520236db0b34SBarry Smith 520305869f15SSatish Balay /*@ 520411a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 520536db0b34SBarry Smith provided by the user. 
520636db0b34SBarry Smith 5207d083f849SBarry Smith Collective 520836db0b34SBarry Smith 520936db0b34SBarry Smith Input Parameters: 521036db0b34SBarry Smith + comm - must be an MPI communicator of size 1 521136db0b34SBarry Smith . m - number of rows 521236db0b34SBarry Smith . n - number of columns 5213483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 521436db0b34SBarry Smith . j - column indices 521536db0b34SBarry Smith - a - matrix values 521636db0b34SBarry Smith 521736db0b34SBarry Smith Output Parameter: 521836db0b34SBarry Smith . mat - the matrix 521936db0b34SBarry Smith 522036db0b34SBarry Smith Level: intermediate 522136db0b34SBarry Smith 522236db0b34SBarry Smith Notes: 52232ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5224292fb18eSBarry Smith once the matrix is destroyed and not before 522536db0b34SBarry Smith 522636db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 522736db0b34SBarry Smith 52282ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 522936db0b34SBarry Smith 5230a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5231a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 52328eef79e4SBarry Smith as shown 52332ef1f0ffSBarry Smith .vb 52342ef1f0ffSBarry Smith 1 0 0 52352ef1f0ffSBarry Smith 2 0 3 52362ef1f0ffSBarry Smith 4 5 6 5237a4552177SSatish Balay 52382ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52392ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52402ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52412ef1f0ffSBarry Smith .ve 5242a4552177SSatish Balay 52431cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 524436db0b34SBarry Smith @*/ 5245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5246d71ae5a4SJacob Faibussowitsch { 5247cbcfb4deSHong Zhang PetscInt ii; 524836db0b34SBarry Smith Mat_SeqAIJ *aij; 5249cbcfb4deSHong Zhang PetscInt jj; 525036db0b34SBarry Smith 525136db0b34SBarry Smith PetscFunctionBegin; 5252aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52539566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52549566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52559566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52569566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5258ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5261ab93d7beSBarry Smith 526236db0b34SBarry Smith aij->i = i; 526336db0b34SBarry Smith aij->j = j; 526436db0b34SBarry Smith aij->a = a; 
526536db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5266e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5267e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 526836db0b34SBarry Smith 5269cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 527036db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 527176bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5272aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52739985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 527408401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 527508401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52769985e31cSBarry Smith } 527736db0b34SBarry Smith } 527876bd3646SJed Brown } 527976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 528036db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 528108401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5282da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 528336db0b34SBarry Smith } 528476bd3646SJed Brown } 528536db0b34SBarry Smith 52869566063dSJacob 
Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52879566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 528936db0b34SBarry Smith } 5290cbc6b225SStefano Zampini 5291f62e3866SBarry Smith /*@ 529211a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52938a0b0e6bSVictor Minden provided by the user. 52948a0b0e6bSVictor Minden 5295d083f849SBarry Smith Collective 52968a0b0e6bSVictor Minden 52978a0b0e6bSVictor Minden Input Parameters: 52988a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52998a0b0e6bSVictor Minden . m - number of rows 53008a0b0e6bSVictor Minden . n - number of columns 53018a0b0e6bSVictor Minden . i - row indices 53028a0b0e6bSVictor Minden . j - column indices 53031230e6d1SVictor Minden . a - matrix values 53041230e6d1SVictor Minden . nz - number of nonzeros 53052ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 53068a0b0e6bSVictor Minden 53078a0b0e6bSVictor Minden Output Parameter: 53088a0b0e6bSVictor Minden . 
mat - the matrix 53098a0b0e6bSVictor Minden 53108a0b0e6bSVictor Minden Level: intermediate 53118a0b0e6bSVictor Minden 5312f62e3866SBarry Smith Example: 5313f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 53149e99939fSJunchao Zhang .vb 53158a0b0e6bSVictor Minden 1 0 0 53168a0b0e6bSVictor Minden 2 0 3 53178a0b0e6bSVictor Minden 4 5 6 53188a0b0e6bSVictor Minden 53198a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53208a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53218a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53229e99939fSJunchao Zhang .ve 5323fe59aa6dSJacob Faibussowitsch 53242ef1f0ffSBarry Smith Note: 5325d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5326d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53278a0b0e6bSVictor Minden 53281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53298a0b0e6bSVictor Minden @*/ 5330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5331d71ae5a4SJacob Faibussowitsch { 5332d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53338a0b0e6bSVictor Minden 53348a0b0e6bSVictor Minden PetscFunctionBegin; 53359566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5336ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53379566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53389566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53399566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53409566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53411230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53421230e6d1SVictor Minden if (idx) { 53431230e6d1SVictor Minden row = i[ii] - 1; 53441230e6d1SVictor Minden col = j[ii] - 1; 53451230e6d1SVictor Minden } else { 53461230e6d1SVictor Minden row = i[ii]; 53471230e6d1SVictor Minden col = j[ii]; 53488a0b0e6bSVictor Minden } 53499566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53508a0b0e6bSVictor Minden } 53519566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53529566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53539566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53558a0b0e6bSVictor Minden } 535636db0b34SBarry Smith 5357d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5358d71ae5a4SJacob Faibussowitsch { 5359acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5360acf2f550SJed Brown 5361acf2f550SJed Brown PetscFunctionBegin; 5362acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5363acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53642205254eSKarl Rupp 53659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5367acf2f550SJed Brown } 5368acf2f550SJed Brown 5369d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5370d71ae5a4SJacob Faibussowitsch { 53719c8f2541SHong Zhang PetscFunctionBegin; 53729566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53749c8f2541SHong Zhang } 53759c8f2541SHong Zhang 537681824310SBarry Smith /* 537753dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 537853dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 537953dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 538053dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 538153dd7562SDmitry Karpeev */ 5382d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5383d71ae5a4SJacob Faibussowitsch { 538453dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 538553dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 538653dd7562SDmitry Karpeev PetscBool seqaij; 538753dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 538853dd7562SDmitry Karpeev PetscScalar v; 538953dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 539053dd7562SDmitry Karpeev 539153dd7562SDmitry Karpeev PetscFunctionBegin; 53923ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 539353dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53949566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 539528b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 539653dd7562SDmitry Karpeev if (rowemb) { 53979566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 539808401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 539953dd7562SDmitry Karpeev } else { 540008401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 540153dd7562SDmitry Karpeev } 540253dd7562SDmitry Karpeev if (colemb) { 54039566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 540408401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 540553dd7562SDmitry Karpeev } else { 540608401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 540753dd7562SDmitry Karpeev } 540853dd7562SDmitry Karpeev 5409f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 541053dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 54119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5412ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 54139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 54149566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 541553dd7562SDmitry Karpeev } 541648a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 541753dd7562SDmitry Karpeev count = 0; 541853dd7562SDmitry Karpeev rowindices = NULL; 
541953dd7562SDmitry Karpeev colindices = NULL; 542048a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 542148a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 542253dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 542353dd7562SDmitry Karpeev PetscInt row; 542453dd7562SDmitry Karpeev row = i; 542553dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 542653dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 542753dd7562SDmitry Karpeev PetscInt col; 542853dd7562SDmitry Karpeev col = Baij->j[count]; 542953dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 543053dd7562SDmitry Karpeev v = Baij->a[count]; 54319566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 543253dd7562SDmitry Karpeev ++count; 543353dd7562SDmitry Karpeev } 543453dd7562SDmitry Karpeev } 543553dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 543653dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 543753dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 543853dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 543953dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 544153dd7562SDmitry Karpeev } 544253dd7562SDmitry Karpeev 544358c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5444dec0b466SHong Zhang { 5445dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5446dec0b466SHong Zhang MatScalar *aa = a->a; 5447dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5448dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5449dec0b466SHong Zhang 5450dec0b466SHong Zhang PetscFunctionBegin; 5451dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5452dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5453dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5454dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5455dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 545658c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5457dec0b466SHong Zhang else { 5458dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5459dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5460dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5461dec0b466SHong Zhang } 5462dec0b466SHong Zhang } 5463dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5464dec0b466SHong Zhang fshift_prev = fshift; 5465dec0b466SHong Zhang /* reset ilen and imax for each row */ 5466dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5467dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5468dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5469dec0b466SHong Zhang } 5470312eded4SPierre Jolivet if (fshift) { 5471dec0b466SHong Zhang if (m) { 5472dec0b466SHong Zhang ai[m] -= fshift; 5473dec0b466SHong Zhang a->nz = ai[m]; 5474dec0b466SHong Zhang } 5475dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5476312eded4SPierre Jolivet A->nonzerostate++; 5477dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5478dec0b466SHong Zhang a->rmax = rmax; 5479dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5480dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5481dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5482312eded4SPierre Jolivet } 54833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5484dec0b466SHong Zhang } 5485dec0b466SHong Zhang 54864099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54874099cc6bSBarry Smith 5488cc4c1da9SBarry Smith /*@ 548911a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54904099cc6bSBarry Smith 5491c3339decSBarry Smith Collective 54924099cc6bSBarry Smith 54934099cc6bSBarry Smith Input Parameters: 54944099cc6bSBarry Smith + mat - the matrix object 54954099cc6bSBarry Smith - matype - matrix type 54964099cc6bSBarry Smith 54974099cc6bSBarry Smith Options Database Key: 54984e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54994099cc6bSBarry Smith 55004099cc6bSBarry Smith Level: intermediate 55014099cc6bSBarry Smith 5502fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 55034099cc6bSBarry Smith @*/ 5504d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5505d71ae5a4SJacob Faibussowitsch { 55064099cc6bSBarry Smith PetscBool sametype; 55075f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 55084099cc6bSBarry Smith 55094099cc6bSBarry Smith PetscFunctionBegin; 55104099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 55119566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 55123ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 55134099cc6bSBarry Smith 55149566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55156adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55169566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55184099cc6bSBarry Smith } 55194099cc6bSBarry Smith 55204099cc6bSBarry Smith /*@C 552111a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55224099cc6bSBarry Smith 5523cc4c1da9SBarry Smith Not Collective, No Fortran Support 55244099cc6bSBarry Smith 55254099cc6bSBarry Smith Input Parameters: 5526fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55274099cc6bSBarry Smith - function - routine to convert to subtype 55284099cc6bSBarry Smith 55292ef1f0ffSBarry Smith Level: advanced 55302ef1f0ffSBarry Smith 55314099cc6bSBarry Smith Notes: 553211a5261eSBarry Smith 
`MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 55334099cc6bSBarry Smith 55344099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55354099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55364099cc6bSBarry Smith 55371cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55384099cc6bSBarry Smith @*/ 5539d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5540d71ae5a4SJacob Faibussowitsch { 55414099cc6bSBarry Smith PetscFunctionBegin; 55429566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55439566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55454099cc6bSBarry Smith } 55464099cc6bSBarry Smith 55474099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55484099cc6bSBarry Smith 55494099cc6bSBarry Smith /*@C 555011a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55514099cc6bSBarry Smith 55524099cc6bSBarry Smith Not Collective 55534099cc6bSBarry Smith 55544099cc6bSBarry Smith Level: advanced 55554099cc6bSBarry Smith 55562ef1f0ffSBarry Smith Note: 55572ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55582ef1f0ffSBarry Smith 55591cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55604099cc6bSBarry Smith @*/ 5561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5562d71ae5a4SJacob Faibussowitsch { 55634099cc6bSBarry Smith PetscFunctionBegin; 55643ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55654099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55664099cc6bSBarry Smith 55679566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 55689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55709779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5572485f9817SRichard Tran Mills #endif 55735063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55755063d097SStefano Zampini #endif 5576d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5577d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5578d5e393b6SSuyash Tandon #endif 55795063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55815063d097SStefano Zampini #endif 55824099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55844099cc6bSBarry Smith #endif 55853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55864099cc6bSBarry Smith } 558753dd7562SDmitry Karpeev 558853dd7562SDmitry Karpeev /* 558981824310SBarry Smith Special version for direct calls from Fortran 559081824310SBarry Smith */ 559181824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 559281824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 559381824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 559481824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 559581824310SBarry Smith #endif 559681824310SBarry Smith 559781824310SBarry Smith /* Change 
these macros so can be used in void function */ 559898921bdaSJacob Faibussowitsch 559998921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 56009566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 56019566063dSJacob Faibussowitsch #undef PetscCall 56029371c9d4SSatish Balay #define PetscCall(...) \ 56039371c9d4SSatish Balay do { \ 56045f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 560598921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 560698921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 560798921bdaSJacob Faibussowitsch return; \ 560898921bdaSJacob Faibussowitsch } \ 560998921bdaSJacob Faibussowitsch } while (0) 561098921bdaSJacob Faibussowitsch 561198921bdaSJacob Faibussowitsch #undef SETERRQ 56129371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 56139371c9d4SSatish Balay do { \ 561498921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 561598921bdaSJacob Faibussowitsch return; \ 561698921bdaSJacob Faibussowitsch } while (0) 561781824310SBarry Smith 5618d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5619d71ae5a4SJacob Faibussowitsch { 562081824310SBarry Smith Mat A = *AA; 562181824310SBarry Smith PetscInt m = *mm, n = *nn; 562281824310SBarry Smith InsertMode is = *isis; 562381824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 562481824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 562581824310SBarry Smith PetscInt *imax, *ai, *ailen; 562681824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 562754f21887SBarry Smith MatScalar *ap, value, 
*aa; 5628ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5629ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 563081824310SBarry Smith 563181824310SBarry Smith PetscFunctionBegin; 56324994cf47SJed Brown MatCheckPreallocated(A, 1); 563381824310SBarry Smith imax = a->imax; 563481824310SBarry Smith ai = a->i; 563581824310SBarry Smith ailen = a->ilen; 563681824310SBarry Smith aj = a->j; 563781824310SBarry Smith aa = a->a; 563881824310SBarry Smith 563981824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 564081824310SBarry Smith row = im[k]; 564181824310SBarry Smith if (row < 0) continue; 56425f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56439371c9d4SSatish Balay rp = aj + ai[row]; 56449371c9d4SSatish Balay ap = aa + ai[row]; 56459371c9d4SSatish Balay rmax = imax[row]; 56469371c9d4SSatish Balay nrow = ailen[row]; 564781824310SBarry Smith low = 0; 564881824310SBarry Smith high = nrow; 564981824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 565081824310SBarry Smith if (in[l] < 0) continue; 56515f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 565281824310SBarry Smith col = in[l]; 56532205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56542205254eSKarl Rupp else value = v[k + l * m]; 56552205254eSKarl Rupp 565681824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 565781824310SBarry Smith 56582205254eSKarl Rupp if (col <= lastcol) low = 0; 56592205254eSKarl Rupp else high = nrow; 566081824310SBarry Smith lastcol = col; 566181824310SBarry Smith while (high - low > 5) { 566281824310SBarry Smith t = (low + high) / 2; 566381824310SBarry Smith if (rp[t] > col) high = t; 566481824310SBarry Smith else low = t; 566581824310SBarry Smith } 566681824310SBarry Smith for (i = low; i < 
high; i++) { 566781824310SBarry Smith if (rp[i] > col) break; 566881824310SBarry Smith if (rp[i] == col) { 566981824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 567081824310SBarry Smith else ap[i] = value; 567181824310SBarry Smith goto noinsert; 567281824310SBarry Smith } 567381824310SBarry Smith } 567481824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 567581824310SBarry Smith if (nonew == 1) goto noinsert; 56765f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5677fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56789371c9d4SSatish Balay N = nrow++ - 1; 56799371c9d4SSatish Balay a->nz++; 56809371c9d4SSatish Balay high++; 568181824310SBarry Smith /* shift up all the later entries in this row */ 568281824310SBarry Smith for (ii = N; ii >= i; ii--) { 568381824310SBarry Smith rp[ii + 1] = rp[ii]; 568481824310SBarry Smith ap[ii + 1] = ap[ii]; 568581824310SBarry Smith } 568681824310SBarry Smith rp[i] = col; 568781824310SBarry Smith ap[i] = value; 568881824310SBarry Smith noinsert:; 568981824310SBarry Smith low = i + 1; 569081824310SBarry Smith } 569181824310SBarry Smith ailen[row] = nrow; 569281824310SBarry Smith } 569381824310SBarry Smith PetscFunctionReturnVoid(); 569481824310SBarry Smith } 569598921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 569698921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 569798921bdaSJacob Faibussowitsch * original definitions */ 56989566063dSJacob Faibussowitsch #undef PetscCall 569998921bdaSJacob Faibussowitsch #undef SETERRQ 5700