1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19421480d9SBarry Smith MatGetDiagonalMarkers(SeqAIJ, 1) 20421480d9SBarry Smith 21ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 22d71ae5a4SJacob Faibussowitsch { 234099cc6bSBarry Smith PetscBool flg; 244099cc6bSBarry Smith char type[256]; 254099cc6bSBarry Smith 264099cc6bSBarry Smith PetscFunctionBegin; 27d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 289566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 299566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 30d0609cedSBarry Smith PetscOptionsEnd(); 313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 324099cc6bSBarry Smith } 334099cc6bSBarry Smith 34ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 35d71ae5a4SJacob Faibussowitsch { 360716a85fSBarry Smith PetscInt i, m, n; 370716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 380716a85fSBarry Smith 390716a85fSBarry Smith PetscFunctionBegin; 409566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 419566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 420716a85fSBarry Smith if (type == NORM_2) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_1) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 460716a85fSBarry Smith } else if (type == NORM_INFINITY) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 50857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 51ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 526adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 530716a85fSBarry Smith 540716a85fSBarry Smith if (type == NORM_2) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 56857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 57a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 580716a85fSBarry Smith } 593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 600716a85fSBarry Smith } 610716a85fSBarry Smith 62ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 63d71ae5a4SJacob Faibussowitsch { 643a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 653a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 663a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 673a062f41SBarry Smith PetscInt *rows; 683a062f41SBarry Smith 693a062f41SBarry Smith PetscFunctionBegin; 703a062f41SBarry Smith for (i = 0; i < m; i++) { 71ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 723a062f41SBarry Smith } 739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 743a062f41SBarry Smith cnt = 0; 753a062f41SBarry Smith for (i = 0; i < m; i++) { 763a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 773a062f41SBarry Smith rows[cnt] = i; 783a062f41SBarry Smith cnt++; 793a062f41SBarry Smith } 803a062f41SBarry Smith } 819566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 833a062f41SBarry Smith } 843a062f41SBarry Smith 85d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 86d71ae5a4SJacob Faibussowitsch { 876ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 88fff043a9SJunchao Zhang const MatScalar *aa; 896ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 90b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 916ce1633cSBarry Smith PetscInt *rows; 926ce1633cSBarry Smith 936ce1633cSBarry Smith PetscFunctionBegin; 949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 95421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL)); 966ce1633cSBarry Smith for (i = 0; i < m; i++) { 97ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 986ce1633cSBarry Smith } 999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 1006ce1633cSBarry Smith cnt = 0; 1016ce1633cSBarry Smith for (i = 0; i < m; i++) { 102ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1036ce1633cSBarry Smith } 104f1f41ecbSJed Brown *nrows = cnt; 105f1f41ecbSJed Brown *zrows = rows; 1069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108f1f41ecbSJed Brown } 109f1f41ecbSJed Brown 110ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 111d71ae5a4SJacob Faibussowitsch { 112f1f41ecbSJed Brown PetscInt nrows, *rows; 113f1f41ecbSJed Brown 114f1f41ecbSJed Brown PetscFunctionBegin; 1150298fd71SBarry Smith *zrows = NULL; 1169566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1179566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1196ce1633cSBarry Smith } 1206ce1633cSBarry Smith 121ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 122d71ae5a4SJacob Faibussowitsch { 123b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 124b3a44c85SBarry Smith const MatScalar *aa; 125b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 126b3a44c85SBarry Smith const PetscInt *ii; 127b3a44c85SBarry Smith PetscInt n, i, j, *rows; 128b3a44c85SBarry Smith 129b3a44c85SBarry Smith PetscFunctionBegin; 1309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 131f4259b30SLisandro Dalcin *keptrows = NULL; 132b3a44c85SBarry Smith ii = a->i; 133b3a44c85SBarry Smith for (i = 0; i < m; i++) { 134b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 135b3a44c85SBarry Smith if (!n) { 136b3a44c85SBarry Smith cnt++; 137b3a44c85SBarry Smith goto ok1; 138b3a44c85SBarry Smith } 1392e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 140b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 141b3a44c85SBarry Smith } 142b3a44c85SBarry Smith cnt++; 143b3a44c85SBarry Smith ok1:; 144b3a44c85SBarry Smith } 1452e5835c6SStefano Zampini if (!cnt) { 1469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1482e5835c6SStefano Zampini } 1499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 150b3a44c85SBarry Smith cnt = 0; 151b3a44c85SBarry Smith for (i = 0; i < m; i++) { 152b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 153b3a44c85SBarry Smith if (!n) continue; 1542e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 155b3a44c85SBarry Smith if (aa[j] != 0.0) { 156b3a44c85SBarry Smith rows[cnt++] = i; 157b3a44c85SBarry Smith break; 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 160b3a44c85SBarry Smith } 1619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1629566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 164b3a44c85SBarry Smith } 165b3a44c85SBarry Smith 166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 167d71ae5a4SJacob Faibussowitsch { 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172421480d9SBarry Smith PetscBool diagDense; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 176421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(Y, &diag, &diagDense)); 177421480d9SBarry Smith if (diagDense) { 1789566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18079299369SBarry Smith if (is == INSERT_VALUES) { 181ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18279299369SBarry Smith } else { 183ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18479299369SBarry Smith } 1859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1869566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18879299369SBarry Smith } 18909f38230SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19209f38230SBarry Smith } 19379299369SBarry Smith 194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 195d71ae5a4SJacob Faibussowitsch { 196416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19797f1f81fSBarry Smith PetscInt i, ishift; 19817ab2063SBarry Smith 1993a40ed3dSBarry Smith PetscFunctionBegin; 200f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2013ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 202bfeeae90SHong Zhang ishift = 0; 203b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2049566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 205bfeeae90SHong Zhang } else if (oshift == 1) { 2061a83f524SJed Brown PetscInt *tia; 207d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2089234b629SBarry Smith 2093b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2111a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2121a83f524SJed Brown *ia = tia; 213ecc77c7aSBarry Smith if (ja) { 2141a83f524SJed Brown PetscInt *tja; 2159234b629SBarry Smith 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 497*418fb43bSPierre Jolivet PetscCall(PetscArraycpy(rp, in, n)); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 500*418fb43bSPierre Jolivet PetscCall(PetscArraycpy(ap, v, n)); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5393a7d0413SPierre Jolivet if (!a->imax) PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 5479f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i)); 5489f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j)); 5499f0612e4SBarry Smith a->free_ij = PETSC_TRUE; 55019b08ed1SBarry Smith if (A->structure_only) { 55119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55219b08ed1SBarry Smith } else { 5539f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a)); 55419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55519b08ed1SBarry Smith } 5569f0612e4SBarry Smith a->i[0] = 0; 55719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith 562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 563d71ae5a4SJacob Faibussowitsch { 564071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 565071fcb05SBarry Smith PetscInt *rp, k, row; 566071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567071fcb05SBarry Smith PetscInt *aj = a->j; 568fff043a9SJunchao Zhang MatScalar *aa, *ap; 569071fcb05SBarry Smith 570071fcb05SBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 572071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 573071fcb05SBarry Smith row = im[k]; 5746bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 575071fcb05SBarry Smith rp = aj + ai[row]; 576071fcb05SBarry Smith ap = aa + ai[row]; 577*418fb43bSPierre Jolivet if (!A->was_assembled) PetscCall(PetscArraycpy(rp, in, n)); 578071fcb05SBarry Smith if (!A->structure_only) { 579071fcb05SBarry Smith if (v) { 580*418fb43bSPierre Jolivet PetscCall(PetscArraycpy(ap, v, n)); 581071fcb05SBarry Smith v += n; 582071fcb05SBarry Smith } else { 5839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 584071fcb05SBarry Smith } 585071fcb05SBarry Smith } 586071fcb05SBarry Smith ailen[row] = n; 587071fcb05SBarry Smith a->nz += n; 588071fcb05SBarry Smith } 5899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith 593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 594d71ae5a4SJacob Faibussowitsch { 5957eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59697f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59797f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5984e208921SJed Brown const MatScalar *ap, *aa; 5997eb43aa7SLois Curfman McInnes 6003a40ed3dSBarry Smith PetscFunctionBegin; 6014e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6027eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6037eb43aa7SLois Curfman McInnes row = im[k]; 6049371c9d4SSatish Balay if (row < 0) { 6059371c9d4SSatish Balay v += n; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative row */ 60854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6098e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6108e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6117eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6127eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6139371c9d4SSatish Balay if (in[l] < 0) { 6149371c9d4SSatish Balay v++; 6159371c9d4SSatish Balay continue; 6169371c9d4SSatish Balay } /* negative column */ 61754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 618bfeeae90SHong Zhang col = in[l]; 6199371c9d4SSatish Balay high = nrow; 6209371c9d4SSatish Balay low = 0; /* assume unsorted */ 6217eb43aa7SLois Curfman McInnes while (high - low > 5) { 6227eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6237eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6247eb43aa7SLois Curfman McInnes else low = t; 6257eb43aa7SLois Curfman McInnes } 6267eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6277eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6287eb43aa7SLois Curfman McInnes if (rp[i] == col) { 629b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6307eb43aa7SLois Curfman McInnes goto finished; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes } 63397e567efSBarry Smith *v++ = 0.0; 6347eb43aa7SLois Curfman McInnes finished:; 6357eb43aa7SLois Curfman McInnes } 6367eb43aa7SLois Curfman McInnes } 6374e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6397eb43aa7SLois Curfman McInnes } 6407eb43aa7SLois Curfman McInnes 641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 642d71ae5a4SJacob Faibussowitsch { 6433ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 644c898d852SStefano Zampini const PetscScalar *av; 6453ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6463ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64717ab2063SBarry Smith 6483a40ed3dSBarry Smith PetscFunctionBegin; 6499566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6502205254eSKarl Rupp 6513ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6523ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6533ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6543ea6fe3dSLisandro Dalcin nz = A->nz; 655416022c9SBarry Smith 6563ea6fe3dSLisandro Dalcin /* write matrix header */ 6573ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6589371c9d4SSatish Balay header[1] = M; 6599371c9d4SSatish Balay header[2] = N; 6609371c9d4SSatish Balay header[3] = nz; 6619566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6653ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 666e457bb90SBarry Smith if (PetscDefined(USE_DEBUG)) { 667e457bb90SBarry Smith PetscInt mnz = 0; 668e457bb90SBarry Smith 669e457bb90SBarry Smith for (i = 0; i < m; i++) mnz += rowlens[i]; 670e457bb90SBarry Smith PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz); 671e457bb90SBarry Smith } 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 702ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 703d71ae5a4SJacob Faibussowitsch { 704416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 705c898d852SStefano Zampini const PetscScalar *av; 70660e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 707e060cb09SBarry Smith const char *name; 708f3ef73ceSBarry Smith PetscViewerFormat format; 70917ab2063SBarry Smith 7103a40ed3dSBarry Smith PetscFunctionBegin; 7117dc0baabSHong Zhang if (A->structure_only) { 7129566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7147dc0baabSHong Zhang } 71543e49210SHong Zhang 7169566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 717bd6a2ce3SJunchao Zhang // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries 7183ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7192e5835c6SStefano Zampini 720c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72371c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72497f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72560e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 726c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 727d00d2cf4SBarry Smith nofinalvalue = 1; 728d00d2cf4SBarry Smith } 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 732fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 734fbfe6fa7SJed Brown #else 7359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 736fbfe6fa7SJed Brown #endif 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73817ab2063SBarry Smith 73917ab2063SBarry Smith for (i = 0; i < m; i++) { 74060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 741aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74317ab2063SBarry Smith #else 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74517ab2063SBarry Smith #endif 74617ab2063SBarry Smith } 74717ab2063SBarry Smith } 748d00d2cf4SBarry Smith if (nofinalvalue) { 749c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 751c337ccceSJed Brown #else 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, A->cmap->n, 0.0)); 753c337ccceSJed Brown #endif 754d00d2cf4SBarry Smith } 7559566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 758fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76044cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 763aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76836db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7706831982aSBarry Smith } 77144cd7ae7SLois Curfman McInnes #else 7729566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77344cd7ae7SLois Curfman McInnes #endif 77444cd7ae7SLois Curfman McInnes } 7759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77644cd7ae7SLois Curfman McInnes } 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 778fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77997f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 782496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 783496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 785496be53dSLois Curfman McInnes if (a->j[j] >= i) { 786aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78736db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 788496be53dSLois Curfman McInnes #else 789496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 790496be53dSLois Curfman McInnes #endif 791496be53dSLois Curfman McInnes } 792496be53dSLois Curfman McInnes } 793496be53dSLois Curfman McInnes } 7942e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7962e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7972205254eSKarl Rupp if (i + 4 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7992205254eSKarl Rupp } else if (i + 3 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8012205254eSKarl Rupp } else if (i + 2 < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8032205254eSKarl Rupp } else if (i + 1 < m) { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8052205254eSKarl Rupp } else if (i < m) { 8069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8072205254eSKarl Rupp } else { 8089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8092205254eSKarl Rupp } 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8129566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 813496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8159566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 816496be53dSLois Curfman McInnes } 8179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 818496be53dSLois Curfman McInnes } 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 820496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 822496be53dSLois Curfman McInnes if (a->j[j] >= i) { 823aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82448a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 825496be53dSLois Curfman McInnes #else 8269566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 827496be53dSLois Curfman McInnes #endif 828496be53dSLois Curfman McInnes } 829496be53dSLois Curfman McInnes } 8309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 831496be53dSLois Curfman McInnes } 8329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 833fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83497f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83587828ca2SBarry Smith PetscScalar value; 83668f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83768f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83868f1ed48SBarry Smith 83968f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84068f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84168f1ed48SBarry Smith realonly = PETSC_FALSE; 84268f1ed48SBarry Smith break; 84368f1ed48SBarry Smith } 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith #endif 84602594712SBarry Smith 8479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84802594712SBarry Smith for (i = 0; i < m; i++) { 84902594712SBarry Smith jcnt = 0; 850d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 851e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85202594712SBarry Smith value = a->a[cnt++]; 853e24b481bSBarry Smith jcnt++; 85402594712SBarry Smith } else { 85502594712SBarry Smith value = 0.0; 85602594712SBarry Smith } 857aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85868f1ed48SBarry Smith if (realonly) { 8599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86068f1ed48SBarry Smith } else { 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86268f1ed48SBarry Smith } 86302594712SBarry Smith #else 8649566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86502594712SBarry Smith #endif 86602594712SBarry Smith } 8679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86802594712SBarry Smith } 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8703c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 871150b93efSMatthew G. Knepley PetscInt fshift = 1; 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8733c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8753c215bfdSMatthew Knepley #else 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8773c215bfdSMatthew Knepley #endif 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8793c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8813c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8833c215bfdSMatthew Knepley #else 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8853c215bfdSMatthew Knepley #endif 8863c215bfdSMatthew Knepley } 8873c215bfdSMatthew Knepley } 8889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8893a40ed3dSBarry Smith } else { 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 891d5f3da31SBarry Smith if (A->factortype) { 892421480d9SBarry Smith const PetscInt *adiag; 893421480d9SBarry Smith 894421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &adiag, NULL)); 89516cd7e1dSShri Abhyankar for (i = 0; i < m; i++) { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89716cd7e1dSShri Abhyankar /* L part */ 89860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89916cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90016cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90216cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90416cd7e1dSShri Abhyankar } else { 9059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90616cd7e1dSShri Abhyankar } 90716cd7e1dSShri Abhyankar #else 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90916cd7e1dSShri Abhyankar #endif 91016cd7e1dSShri Abhyankar } 91116cd7e1dSShri Abhyankar /* diagonal */ 912421480d9SBarry Smith j = adiag[i]; 91316cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91416cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 915835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j]))); 91616cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 917835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j])))); 91816cd7e1dSShri Abhyankar } else { 919835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j]))); 92016cd7e1dSShri Abhyankar } 92116cd7e1dSShri Abhyankar #else 922835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j]))); 92316cd7e1dSShri Abhyankar #endif 92416cd7e1dSShri Abhyankar 92516cd7e1dSShri Abhyankar /* U part */ 926421480d9SBarry Smith for (j = adiag[i + 1] + 1; j < adiag[i]; j++) { 92716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93216cd7e1dSShri Abhyankar } else { 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93416cd7e1dSShri Abhyankar } 93516cd7e1dSShri Abhyankar #else 9369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93716cd7e1dSShri Abhyankar #endif 93816cd7e1dSShri Abhyankar } 9399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94016cd7e1dSShri Abhyankar } 94116cd7e1dSShri Abhyankar } else { 94217ab2063SBarry Smith for (i = 0; i < m; i++) { 9439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 945aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94836db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9503a40ed3dSBarry Smith } else { 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95217ab2063SBarry Smith } 95317ab2063SBarry Smith #else 9549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95517ab2063SBarry Smith #endif 95617ab2063SBarry Smith } 9579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95817ab2063SBarry Smith } 95916cd7e1dSShri Abhyankar } 9609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 96117ab2063SBarry Smith } 9629566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 964416022c9SBarry Smith } 965416022c9SBarry Smith 9669804daf3SBarry Smith #include <petscdraw.h> 967ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 968d71ae5a4SJacob Faibussowitsch { 969480ef9eaSBarry Smith Mat A = (Mat)Aa; 970416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 971383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 972383922c3SLisandro Dalcin int color; 973b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 974b0a32e0cSBarry Smith PetscViewer viewer; 975f3ef73ceSBarry Smith PetscViewerFormat format; 976fff043a9SJunchao Zhang const PetscScalar *aa; 977cddf8d76SBarry Smith 9783a40ed3dSBarry Smith PetscFunctionBegin; 9799566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9809566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9819566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 982383922c3SLisandro Dalcin 983416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 985fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 986d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9870513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 988b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 989416022c9SBarry Smith for (i = 0; i < m; i++) { 9909371c9d4SSatish Balay y_l = m - i - 1.0; 9919371c9d4SSatish Balay y_r = y_l + 1.0; 992bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9939371c9d4SSatish Balay x_l = a->j[j]; 9949371c9d4SSatish Balay x_r = x_l + 1.0; 995fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9969566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 997cddf8d76SBarry Smith } 998cddf8d76SBarry Smith } 999b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 1000cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10019371c9d4SSatish Balay y_l = m - i - 1.0; 10029371c9d4SSatish Balay y_r = y_l + 1.0; 1003bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10049371c9d4SSatish Balay x_l = a->j[j]; 10059371c9d4SSatish Balay x_r = x_l + 1.0; 1006fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10079566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1008cddf8d76SBarry Smith } 1009cddf8d76SBarry Smith } 1010b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1011cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10129371c9d4SSatish Balay y_l = m - i - 1.0; 10139371c9d4SSatish Balay y_r = y_l + 1.0; 1014bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10159371c9d4SSatish Balay x_l = a->j[j]; 10169371c9d4SSatish Balay x_r = x_l + 1.0; 1017fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10189566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1019416022c9SBarry Smith } 1020416022c9SBarry Smith } 1021d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10220513a670SBarry Smith } else { 10230513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10240513a670SBarry Smith /* first determine max of all nonzero values */ 1025b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1026383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1027b0a32e0cSBarry Smith PetscDraw popup; 10280513a670SBarry Smith 10290513a670SBarry Smith for (i = 0; i < nz; i++) { 1030fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10310513a670SBarry Smith } 1032383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10339566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10349566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1035383922c3SLisandro Dalcin 1036d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10370513a670SBarry Smith for (i = 0; i < m; i++) { 1038383922c3SLisandro Dalcin y_l = m - i - 1.0; 1039383922c3SLisandro Dalcin y_r = y_l + 1.0; 1040bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1041383922c3SLisandro Dalcin x_l = a->j[j]; 1042383922c3SLisandro Dalcin x_r = x_l + 1.0; 1043fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10449566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10450513a670SBarry Smith count++; 10460513a670SBarry Smith } 10470513a670SBarry Smith } 1048d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10490513a670SBarry Smith } 10509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1052480ef9eaSBarry Smith } 1053cddf8d76SBarry Smith 10549804daf3SBarry Smith #include <petscdraw.h> 1055ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1056d71ae5a4SJacob Faibussowitsch { 1057b0a32e0cSBarry Smith PetscDraw draw; 105836db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1059ace3abfcSBarry Smith PetscBool isnull; 1060480ef9eaSBarry Smith 1061480ef9eaSBarry Smith PetscFunctionBegin; 10629566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10639566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10643ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1065480ef9eaSBarry Smith 10669371c9d4SSatish Balay xr = A->cmap->n; 10679371c9d4SSatish Balay yr = A->rmap->n; 10689371c9d4SSatish Balay h = yr / 10.0; 10699371c9d4SSatish Balay w = xr / 10.0; 10709371c9d4SSatish Balay xr += w; 10719371c9d4SSatish Balay yr += h; 10729371c9d4SSatish Balay xl = -w; 10739371c9d4SSatish Balay yl = -h; 10749566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10759566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10769566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10779566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10789566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1080416022c9SBarry Smith } 1081416022c9SBarry Smith 1082d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1083d71ae5a4SJacob Faibussowitsch { 10849f196a02SMartin Diehl PetscBool isascii, isbinary, isdraw; 1085416022c9SBarry Smith 10863a40ed3dSBarry Smith PetscFunctionBegin; 10879f196a02SMartin Diehl PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii)); 10889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10899566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10909f196a02SMartin Diehl if (isascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10911baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10921baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10939566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109517ab2063SBarry Smith } 109619bcc07fSBarry Smith 1097d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1098d71ae5a4SJacob Faibussowitsch { 1099416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1100580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 110107425a8dSBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 110254f21887SBarry Smith MatScalar *aa = a->a, *ap; 11033447b6efSHong Zhang PetscReal ratio = 0.6; 110417ab2063SBarry Smith 11053a40ed3dSBarry Smith PetscFunctionBegin; 11063ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 1107b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 110855a7f34eSJunchao Zhang /* we need to respect users asking to use or not the inodes routine in between matrix assemblies, e.g., via MatSetOption(A, MAT_USE_INODES, val) */ 110955a7f34eSJunchao Zhang PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); /* read the sparsity pattern */ 11103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1111b215bc84SStefano Zampini } 111217ab2063SBarry Smith 111343ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111417ab2063SBarry Smith for (i = 1; i < m; i++) { 1115416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111617ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111794a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111817ab2063SBarry Smith if (fshift) { 1119bfeeae90SHong Zhang ip = aj + ai[i]; 1120bfeeae90SHong Zhang ap = aa + ai[i]; 112117ab2063SBarry Smith N = ailen[i]; 11229566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112348a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112417ab2063SBarry Smith } 112517ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112617ab2063SBarry Smith } 112717ab2063SBarry Smith if (m) { 112817ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112917ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 113017ab2063SBarry Smith } 113117ab2063SBarry Smith /* reset ilen and imax for each row */ 11327b083b7cSBarry Smith a->nonzerorowcnt = 0; 1133396832f4SHong Zhang if (A->structure_only) { 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11359566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1136396832f4SHong Zhang } else { /* !A->structure_only */ 113717ab2063SBarry Smith for (i = 0; i < m; i++) { 113817ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11397b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 114017ab2063SBarry Smith } 1141396832f4SHong Zhang } 1142bfeeae90SHong Zhang a->nz = ai[m]; 1143aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 11449566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11459566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11469566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11472205254eSKarl Rupp 11488e58a170SBarry Smith A->info.mallocs += a->reallocs; 1149dd5f02e7SSatish Balay a->reallocs = 0; 11506712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115136db0b34SBarry Smith a->rmax = rmax; 11524e220ebcSLois Curfman McInnes 115348a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11549566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115617ab2063SBarry Smith } 115717ab2063SBarry Smith 1158ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1159d71ae5a4SJacob Faibussowitsch { 116099cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116199cafbc1SBarry Smith PetscInt i, nz = a->nz; 11622e5835c6SStefano Zampini MatScalar *aa; 116399cafbc1SBarry Smith 116499cafbc1SBarry Smith PetscFunctionBegin; 11659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116699cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116999cafbc1SBarry Smith } 117099cafbc1SBarry Smith 1171ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1172d71ae5a4SJacob Faibussowitsch { 117399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117499cafbc1SBarry Smith PetscInt i, nz = a->nz; 11752e5835c6SStefano Zampini MatScalar *aa; 117699cafbc1SBarry Smith 117799cafbc1SBarry Smith PetscFunctionBegin; 11789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118299cafbc1SBarry Smith } 118399cafbc1SBarry Smith 1184d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1185d71ae5a4SJacob Faibussowitsch { 1186fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1187fff043a9SJunchao Zhang MatScalar *aa; 11883a40ed3dSBarry Smith 11893a40ed3dSBarry Smith PetscFunctionBegin; 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11919566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119417ab2063SBarry Smith } 1195416022c9SBarry Smith 1196674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A) 1197d71ae5a4SJacob Faibussowitsch { 1198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1199d5d45c9bSBarry Smith 12003a40ed3dSBarry Smith PetscFunctionBegin; 1201b4e2f619SBarry Smith if (A->hash_active) { 1202e3c72094SPierre Jolivet A->ops[0] = a->cops; 1203b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1204b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1205b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1206b4e2f619SBarry Smith } 1207b4e2f619SBarry Smith 12083ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12099566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12109566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12119566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12129566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12139566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12149566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12159566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12199566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 1221820d003aSStefano Zampini a->compressedrow.use = PETSC_FALSE; 12229566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12239566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 1224674b392bSAlexander PetscFunctionReturn(PETSC_SUCCESS); 1225674b392bSAlexander } 1226674b392bSAlexander 1227674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A) 1228674b392bSAlexander { 1229674b392bSAlexander PetscFunctionBegin; 1230674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 1231674b392bSAlexander PetscCall(MatCreate_SeqAIJ_Inode(A)); 1232674b392bSAlexander PetscCall(MatSetUp_Seq_Hash(A)); 1233674b392bSAlexander A->nonzerostate++; 1234674b392bSAlexander PetscFunctionReturn(PETSC_SUCCESS); 1235674b392bSAlexander } 1236674b392bSAlexander 1237674b392bSAlexander PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1238674b392bSAlexander { 1239674b392bSAlexander PetscFunctionBegin; 1240674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 12419566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1242901853e0SKris Buschelman 12436718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12446718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12456718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12466718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12476718818eSStefano Zampini due to different matrix sizes */ 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12496718818eSStefano Zampini 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12512e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12522e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12592e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12602e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12612e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12622e956fe4SStefano Zampini #endif 12634222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12674222ddf1SHong Zhang #endif 1268d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1269d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1270d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1271d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1272d5e393b6SSuyash Tandon #endif 12733d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12753d0639e7SStefano Zampini #endif 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1277af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1279af8000cdSHong Zhang #endif 1280d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE)) 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1282d24d4204SJose E. Roman #endif 128363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 128663c07aadSStefano Zampini #endif 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12912e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 1294674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL)); 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 13029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 13032e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 13042e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13052e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 13062e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 13072e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13092e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 131117ab2063SBarry Smith } 131217ab2063SBarry Smith 1313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1314d71ae5a4SJacob Faibussowitsch { 1315416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13163a40ed3dSBarry Smith 13173a40ed3dSBarry Smith PetscFunctionBegin; 1318a65d3064SKris Buschelman switch (op) { 1319d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1320d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1321d71ae5a4SJacob Faibussowitsch break; 1322d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1323d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1324d71ae5a4SJacob Faibussowitsch break; 1325d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1326d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1327d71ae5a4SJacob Faibussowitsch break; 1328d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1329d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1330d71ae5a4SJacob Faibussowitsch break; 1331d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1332d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1333d71ae5a4SJacob Faibussowitsch break; 1334d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1335d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1336d71ae5a4SJacob Faibussowitsch break; 1337d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1338d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1339d71ae5a4SJacob Faibussowitsch break; 1340d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1341d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1342d71ae5a4SJacob Faibussowitsch break; 1343d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1344d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1345d71ae5a4SJacob Faibussowitsch break; 1346071fcb05SBarry Smith case MAT_SORTED_FULL: 1347071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1348071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1349071fcb05SBarry Smith break; 1350d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1351d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1352d71ae5a4SJacob Faibussowitsch break; 1353d71ae5a4SJacob Faibussowitsch default: 1354888c827cSStefano Zampini break; 1355a65d3064SKris Buschelman } 13563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 135717ab2063SBarry Smith } 135817ab2063SBarry Smith 13599ee18893SBarry Smith PETSC_INTERN PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1360d71ae5a4SJacob Faibussowitsch { 1361416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1362421480d9SBarry Smith PetscInt n, *ai = a->i; 1363c898d852SStefano Zampini PetscScalar *x; 1364c898d852SStefano Zampini const PetscScalar *aa; 1365421480d9SBarry Smith const PetscInt *diag; 1366421480d9SBarry Smith PetscBool diagDense; 136717ab2063SBarry Smith 13683a40ed3dSBarry Smith PetscFunctionBegin; 13699566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1372d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1373421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL)); 13749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 1375421480d9SBarry Smith for (PetscInt i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 137935e7444dSHong Zhang } 138035e7444dSHong Zhang 1381421480d9SBarry Smith PetscCheck(A->factortype == MAT_FACTOR_NONE, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Not for factor matrices that are not ILU or LU"); 1382421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense)); 13839566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 1384421480d9SBarry Smith if (diagDense) { 1385421480d9SBarry Smith for (PetscInt i = 0; i < n; i++) x[i] = aa[diag[i]]; 1386421480d9SBarry Smith } else { 1387421480d9SBarry Smith for (PetscInt i = 0; i < n; i++) x[i] = (diag[i] == ai[i + 1]) ? 0.0 : aa[diag[i]]; 138817ab2063SBarry Smith } 13899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139217ab2063SBarry Smith } 139317ab2063SBarry Smith 1394c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1395d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1396d71ae5a4SJacob Faibussowitsch { 1397416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13985f22a7b3SSebastian Grimberg const MatScalar *aa; 1399d9ca1df4SBarry Smith PetscScalar *y; 1400d9ca1df4SBarry Smith const PetscScalar *x; 1401d0f46423SBarry Smith PetscInt m = A->rmap->n; 14025c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14035f22a7b3SSebastian Grimberg const MatScalar *v; 1404a77337e4SBarry Smith PetscScalar alpha; 1405d9ca1df4SBarry Smith PetscInt n, i, j; 1406d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14073447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1408ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14095c897100SBarry Smith #endif 141017ab2063SBarry Smith 14113a40ed3dSBarry Smith PetscFunctionBegin; 14129566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14139566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14149566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14165c897100SBarry Smith 14175c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1418fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14195c897100SBarry Smith #else 14203447b6efSHong Zhang if (usecprow) { 14213447b6efSHong Zhang m = cprow.nrows; 14223447b6efSHong Zhang ii = cprow.i; 14237b2bb3b9SHong Zhang ridx = cprow.rindex; 14243447b6efSHong Zhang } else { 14253447b6efSHong Zhang ii = a->i; 14263447b6efSHong Zhang } 142717ab2063SBarry Smith for (i = 0; i < m; i++) { 14283447b6efSHong Zhang idx = a->j + ii[i]; 1429fff043a9SJunchao Zhang v = aa + ii[i]; 14303447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14313447b6efSHong Zhang if (usecprow) { 14327b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14333447b6efSHong Zhang } else { 143417ab2063SBarry Smith alpha = x[i]; 14353447b6efSHong Zhang } 143604fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143717ab2063SBarry Smith } 14385c897100SBarry Smith #endif 14399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14409566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14419566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 144417ab2063SBarry Smith } 144517ab2063SBarry Smith 1446d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1447d71ae5a4SJacob Faibussowitsch { 14485c897100SBarry Smith PetscFunctionBegin; 14499566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14509566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14525c897100SBarry Smith } 14535c897100SBarry Smith 1454c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145578b84d54SShri Abhyankar 1456d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1457d71ae5a4SJacob Faibussowitsch { 1458416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1459d9fead3dSBarry Smith PetscScalar *y; 146054f21887SBarry Smith const PetscScalar *x; 14615914357eSBarry Smith const MatScalar *a_a; 1462003131ecSBarry Smith PetscInt m = A->rmap->n; 14635914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 1464ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146517ab2063SBarry Smith 1466b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146797952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1468fee21e36SBarry Smith #endif 1469fee21e36SBarry Smith 14703a40ed3dSBarry Smith PetscFunctionBegin; 1471b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14729566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1474b215bc84SStefano Zampini } 14759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14769566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14779566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1478416022c9SBarry Smith ii = a->i; 14794eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14809566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 148197952fefSHong Zhang m = a->compressedrow.nrows; 148297952fefSHong Zhang ii = a->compressedrow.i; 148397952fefSHong Zhang ridx = a->compressedrow.rindex; 14845914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 14855914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 14865914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 14875914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 14885914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 14895914357eSBarry Smith PetscScalar sum = 0.0; 1490003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1491003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1492c9a1b032SJunchao Zhang y[ridx[i]] = sum; 149397952fefSHong Zhang } 149497952fefSHong Zhang } else { /* do not use compressed row format */ 1495b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14965914357eSBarry Smith fortranmultaij_(&m, x, ii, a->j, a_a, y); 1497b05257ddSBarry Smith #else 14985914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 14995914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15005914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15015914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15025914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15035914357eSBarry Smith PetscScalar sum = 0.0; 1504003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150517ab2063SBarry Smith y[i] = sum; 150617ab2063SBarry Smith } 15078d195f9aSBarry Smith #endif 1508b05257ddSBarry Smith } 15099566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15109566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15119566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 151417ab2063SBarry Smith } 151517ab2063SBarry Smith 1516ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1517ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1518d71ae5a4SJacob Faibussowitsch { 1519b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1520b434eb95SMatthew G. Knepley PetscScalar *y; 1521b434eb95SMatthew G. Knepley const PetscScalar *x; 1522fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1523b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1524b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1525b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1526b434eb95SMatthew G. Knepley PetscScalar sum; 1527b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1528b434eb95SMatthew G. Knepley 1529b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1530b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1531b434eb95SMatthew G. Knepley #endif 1532b434eb95SMatthew G. Knepley 1533b434eb95SMatthew G. Knepley PetscFunctionBegin; 15349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15359566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15369566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1537b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1538b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1539b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1540b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1541b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1542b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1543b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1544fff043a9SJunchao Zhang aa = a_a + ii[i]; 1545b434eb95SMatthew G. Knepley sum = 0.0; 1546b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1547b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1548b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1549b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1550b434eb95SMatthew G. Knepley } 1551b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15523d3eaba7SBarry Smith ii = a->i; 1553b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1554b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1555b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1556fff043a9SJunchao Zhang aa = a_a + ii[i]; 1557b434eb95SMatthew G. Knepley sum = 0.0; 1558b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1559b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1560b434eb95SMatthew G. Knepley y[i] = sum; 1561b434eb95SMatthew G. Knepley } 1562b434eb95SMatthew G. Knepley } 15639566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15659566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1568b434eb95SMatthew G. Knepley } 1569b434eb95SMatthew G. Knepley 1570ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1571ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1572d71ae5a4SJacob Faibussowitsch { 1573b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1574b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1575b434eb95SMatthew G. Knepley const PetscScalar *x; 1576fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1577b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1578b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1579b434eb95SMatthew G. Knepley PetscScalar sum; 1580b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1581b434eb95SMatthew G. Knepley 1582b434eb95SMatthew G. Knepley PetscFunctionBegin; 15839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15849566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15859566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1586b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1588b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1589b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1590b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1591b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1592b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1593b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1594fff043a9SJunchao Zhang aa = a_a + ii[i]; 1595b434eb95SMatthew G. Knepley sum = y[*ridx]; 1596b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1597b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1598b434eb95SMatthew G. Knepley } 1599b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16003d3eaba7SBarry Smith ii = a->i; 1601b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1602b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1603b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1604fff043a9SJunchao Zhang aa = a_a + ii[i]; 1605b434eb95SMatthew G. Knepley sum = y[i]; 1606b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1607b434eb95SMatthew G. Knepley z[i] = sum; 1608b434eb95SMatthew G. Knepley } 1609b434eb95SMatthew G. Knepley } 16109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16129566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1615b434eb95SMatthew G. Knepley } 1616b434eb95SMatthew G. Knepley 1617c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1618d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1619d71ae5a4SJacob Faibussowitsch { 1620416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1621f15663dcSBarry Smith PetscScalar *y, *z; 1622f15663dcSBarry Smith const PetscScalar *x; 16235914357eSBarry Smith const MatScalar *a_a; 16245914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 16255914357eSBarry Smith PetscInt m = A->rmap->n; 1626ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16279ea0dfa2SSatish Balay 16283a40ed3dSBarry Smith PetscFunctionBegin; 1629b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16309566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1632b215bc84SStefano Zampini } 16339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16349566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16359566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16364eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 163748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163897952fefSHong Zhang m = a->compressedrow.nrows; 163997952fefSHong Zhang ii = a->compressedrow.i; 164097952fefSHong Zhang ridx = a->compressedrow.rindex; 16415914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16425914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16435914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16445914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16455914357eSBarry Smith PetscScalar sum = y[*ridx]; 1646f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164797952fefSHong Zhang z[*ridx++] = sum; 164897952fefSHong Zhang } 164997952fefSHong Zhang } else { /* do not use compressed row format */ 16503d3eaba7SBarry Smith ii = a->i; 1651f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16525914357eSBarry Smith fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z); 1653f15663dcSBarry Smith #else 16545914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 16555914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16565914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16575914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16585914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16595914357eSBarry Smith PetscScalar sum = y[i]; 1660f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166117ab2063SBarry Smith z[i] = sum; 166217ab2063SBarry Smith } 166302ab625aSSatish Balay #endif 1664f15663dcSBarry Smith } 16659566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16669566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16679566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167017ab2063SBarry Smith } 167117ab2063SBarry Smith 1672ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1673d71ae5a4SJacob Faibussowitsch { 167461ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1675421480d9SBarry Smith const PetscInt *diag; 167661ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 1677421480d9SBarry Smith PetscBool diagDense; 167861ecd0c6SBarry Smith 167961ecd0c6SBarry Smith PetscFunctionBegin; 168061ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 16819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 16829566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 16833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168461ecd0c6SBarry Smith } 168561ecd0c6SBarry Smith 1686421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense)); 1687421480d9SBarry Smith if (diagDense) { 16889234b629SBarry Smith PetscScalar *Aa; 16899234b629SBarry Smith 16909234b629SBarry Smith PetscCall(MatSeqAIJGetArray(A, &Aa)); 16919234b629SBarry Smith for (PetscInt i = 0; i < A->rmap->n; i++) Aa[diag[i]] += v; 16929234b629SBarry Smith PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 169361ecd0c6SBarry Smith } else { 1694b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1695b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 16969f0612e4SBarry Smith PetscBool free_a = a->free_a, free_ij = a->free_ij; 16976ea2a7edSJunchao Zhang const PetscScalar *Aa; 169807425a8dSBarry Smith PetscInt *mdiag = NULL; 16996ea2a7edSJunchao Zhang 170007425a8dSBarry Smith PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 170107425a8dSBarry Smith for (PetscInt i = 0; i < A->rmap->n; i++) { 170207425a8dSBarry Smith if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 170307425a8dSBarry Smith mdiag[i] = 1; 170407425a8dSBarry Smith } 170507425a8dSBarry Smith } 17066ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17076ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 170861ecd0c6SBarry Smith 170961ecd0c6SBarry Smith a->a = NULL; 171061ecd0c6SBarry Smith a->j = NULL; 171161ecd0c6SBarry Smith a->i = NULL; 171261ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 171307425a8dSBarry Smith for (PetscInt i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 171561ecd0c6SBarry Smith 171661ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 171707425a8dSBarry Smith for (PetscInt i = 0; i < A->rmap->n; i++) { 17189566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 171948a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1720447d62f5SStefano Zampini } 17219566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17229566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 17239f0612e4SBarry Smith if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda)); 17249f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj)); 17259f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi)); 17269566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 1727be5855fcSBarry Smith } 17283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1729be5855fcSBarry Smith } 1730be5855fcSBarry Smith 17310da83c2eSBarry Smith #include <petscblaslapack.h> 17320da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17330da83c2eSBarry Smith 17340da83c2eSBarry Smith /* 17350da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17360da83c2eSBarry Smith */ 1737ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1738d71ae5a4SJacob Faibussowitsch { 17390da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 17400da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 17410da83c2eSBarry Smith const PetscReal shift = 0.0; 17420da83c2eSBarry Smith PetscInt ipvt[5]; 17434e208921SJed Brown PetscCount flops = 0; 17440da83c2eSBarry Smith PetscScalar work[25], *v_work; 17450da83c2eSBarry Smith 17460da83c2eSBarry Smith PetscFunctionBegin; 17470da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 17480da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 174908401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1750ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 17519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 175248a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 17530da83c2eSBarry Smith ncnt = 0; 17540da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 17550da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 17569566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 17570da83c2eSBarry Smith switch (bsizes[i]) { 1758d71ae5a4SJacob Faibussowitsch case 1: 1759d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1760d71ae5a4SJacob Faibussowitsch break; 17610da83c2eSBarry Smith case 2: 17629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 17630da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 17650da83c2eSBarry Smith break; 17660da83c2eSBarry Smith case 3: 17679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 17680da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17699566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 17700da83c2eSBarry Smith break; 17710da83c2eSBarry Smith case 4: 17729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 17730da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 17750da83c2eSBarry Smith break; 17760da83c2eSBarry Smith case 5: 17779566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 17780da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17799566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 17800da83c2eSBarry Smith break; 17810da83c2eSBarry Smith case 6: 17829566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 17830da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17849566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 17850da83c2eSBarry Smith break; 17860da83c2eSBarry Smith case 7: 17879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 17880da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17899566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 17900da83c2eSBarry Smith break; 17910da83c2eSBarry Smith default: 17929566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 17930da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17949566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 17950da83c2eSBarry Smith } 17960da83c2eSBarry Smith ncnt += bsizes[i]; 17970da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1798baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 17990da83c2eSBarry Smith } 18003ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 180148a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18029566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18040da83c2eSBarry Smith } 18050da83c2eSBarry Smith 1806422a814eSBarry Smith /* 1807422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1808422a814eSBarry Smith */ 180907425a8dSBarry Smith static PetscErrorCode MatInvertDiagonalForSOR_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1810d71ae5a4SJacob Faibussowitsch { 181171f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1812421480d9SBarry Smith PetscInt i, m = A->rmap->n; 18132e5835c6SStefano Zampini const MatScalar *v; 181454f21887SBarry Smith PetscScalar *idiag, *mdiag; 1815421480d9SBarry Smith PetscBool diagDense; 1816421480d9SBarry Smith const PetscInt *diag; 181771f1c65dSBarry Smith 181871f1c65dSBarry Smith PetscFunctionBegin; 181907425a8dSBarry Smith if (a->idiagState == ((PetscObject)A)->state && a->omega == omega && a->fshift == fshift) PetscFunctionReturn(PETSC_SUCCESS); 1820421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense)); 1821421480d9SBarry Smith PetscCheck(diagDense, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix must have all diagonal locations to invert them"); 18223a7d0413SPierre Jolivet if (!a->idiag) PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); 18232e5835c6SStefano Zampini 182471f1c65dSBarry Smith mdiag = a->mdiag; 182571f1c65dSBarry Smith idiag = a->idiag; 18269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1827422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 182871f1c65dSBarry Smith for (i = 0; i < m; i++) { 182971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1830899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1831966bd95aSPierre Jolivet PetscCheck(PetscRealPart(fshift), PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 18329566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18337b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18347b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18357b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 1836899639b0SHong Zhang } 183771f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 183871f1c65dSBarry Smith } 18399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 184071f1c65dSBarry Smith } else { 184171f1c65dSBarry Smith for (i = 0; i < m; i++) { 184271f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 184371f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 184471f1c65dSBarry Smith } 18459566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 184671f1c65dSBarry Smith } 18479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 184807425a8dSBarry Smith a->idiagState = ((PetscObject)A)->state; 184907425a8dSBarry Smith a->omega = omega; 185007425a8dSBarry Smith a->fshift = fshift; 18513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 185271f1c65dSBarry Smith } 185371f1c65dSBarry Smith 1854d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1855d71ae5a4SJacob Faibussowitsch { 1856416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1857e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 18582e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 185954f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 18603d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 186197f1f81fSBarry Smith const PetscInt *idx, *diag; 186217ab2063SBarry Smith 18633a40ed3dSBarry Smith PetscFunctionBegin; 1864b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 18659566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 18663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1867b215bc84SStefano Zampini } 1868b965ef7fSBarry Smith its = its * lits; 186907425a8dSBarry Smith PetscCall(MatInvertDiagonalForSOR_SeqAIJ(A, omega, fshift)); 1870421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL)); 187171f1c65dSBarry Smith t = a->ssor_work; 1872ed480e8bSBarry Smith idiag = a->idiag; 187371f1c65dSBarry Smith mdiag = a->mdiag; 1874ed480e8bSBarry Smith 18759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 18769566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 18779566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1878ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 187917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 188017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1881ed480e8bSBarry Smith bs = b; 188217ab2063SBarry Smith for (i = 0; i < m; i++) { 188371f1c65dSBarry Smith d = fshift + mdiag[i]; 1884416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1885ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 18862e5835c6SStefano Zampini v = aa + diag[i] + 1; 188717ab2063SBarry Smith sum = b[i] * d / omega; 1888003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 188917ab2063SBarry Smith x[i] = sum; 189017ab2063SBarry Smith } 18919566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 18929566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 18939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 18949566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 18953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 189617ab2063SBarry Smith } 1897c783ea89SBarry Smith 189808401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1899f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19004c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1901887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 190217ab2063SBarry Smith 190317ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 190417ab2063SBarry Smith 1905887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 190617ab2063SBarry Smith */ 190717ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 190817ab2063SBarry Smith 190917ab2063SBarry Smith /* x = (E + U)^{-1} b */ 191017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1911416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1912ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19132e5835c6SStefano Zampini v = aa + diag[i] + 1; 191417ab2063SBarry Smith sum = b[i]; 1915e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1916ed480e8bSBarry Smith x[i] = sum * idiag[i]; 191717ab2063SBarry Smith } 191817ab2063SBarry Smith 191917ab2063SBarry Smith /* t = b - (2*E - D)x */ 19202e5835c6SStefano Zampini v = aa; 19212205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 192217ab2063SBarry Smith 192317ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1924ed480e8bSBarry Smith ts = t; 1925416022c9SBarry Smith diag = a->diag; 192617ab2063SBarry Smith for (i = 0; i < m; i++) { 1927416022c9SBarry Smith n = diag[i] - a->i[i]; 1928ed480e8bSBarry Smith idx = a->j + a->i[i]; 19292e5835c6SStefano Zampini v = aa + a->i[i]; 193017ab2063SBarry Smith sum = t[i]; 1931003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1932ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1933733d66baSBarry Smith /* x = x + t */ 1934733d66baSBarry Smith x[i] += t[i]; 193517ab2063SBarry Smith } 193617ab2063SBarry Smith 19379566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 19389566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19399566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 194117ab2063SBarry Smith } 194217ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 194317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 194417ab2063SBarry Smith for (i = 0; i < m; i++) { 1945416022c9SBarry Smith n = diag[i] - a->i[i]; 1946ed480e8bSBarry Smith idx = a->j + a->i[i]; 19472e5835c6SStefano Zampini v = aa + a->i[i]; 194817ab2063SBarry Smith sum = b[i]; 1949e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 19505c99c7daSBarry Smith t[i] = sum; 1951ed480e8bSBarry Smith x[i] = sum * idiag[i]; 195217ab2063SBarry Smith } 19535c99c7daSBarry Smith xb = t; 19549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19553a40ed3dSBarry Smith } else xb = b; 195617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 195717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1958416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1959ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19602e5835c6SStefano Zampini v = aa + diag[i] + 1; 196117ab2063SBarry Smith sum = xb[i]; 1962e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 19635c99c7daSBarry Smith if (xb == b) { 1964ed480e8bSBarry Smith x[i] = sum * idiag[i]; 19655c99c7daSBarry Smith } else { 1966b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 196717ab2063SBarry Smith } 19685c99c7daSBarry Smith } 19699566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 197017ab2063SBarry Smith } 197117ab2063SBarry Smith its--; 197217ab2063SBarry Smith } 197317ab2063SBarry Smith while (its--) { 197417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 197517ab2063SBarry Smith for (i = 0; i < m; i++) { 1976b19a5dc2SMark Adams /* lower */ 1977b19a5dc2SMark Adams n = diag[i] - a->i[i]; 1978ed480e8bSBarry Smith idx = a->j + a->i[i]; 19792e5835c6SStefano Zampini v = aa + a->i[i]; 198017ab2063SBarry Smith sum = b[i]; 1981e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1982b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 1983b19a5dc2SMark Adams /* upper */ 1984b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 1985b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 19862e5835c6SStefano Zampini v = aa + diag[i] + 1; 1987b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 1988b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 198917ab2063SBarry Smith } 1990b19a5dc2SMark Adams xb = t; 19919566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 1992b19a5dc2SMark Adams } else xb = b; 199317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 199417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1995b19a5dc2SMark Adams sum = xb[i]; 1996b19a5dc2SMark Adams if (xb == b) { 1997b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 1998416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 1999ed480e8bSBarry Smith idx = a->j + a->i[i]; 20002e5835c6SStefano Zampini v = aa + a->i[i]; 2001e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2002ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2003b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2004b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2005b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20062e5835c6SStefano Zampini v = aa + diag[i] + 1; 2007b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2008b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 200917ab2063SBarry Smith } 2010b19a5dc2SMark Adams } 2011b19a5dc2SMark Adams if (xb == b) { 20129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2013b19a5dc2SMark Adams } else { 20149566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2015b19a5dc2SMark Adams } 201617ab2063SBarry Smith } 201717ab2063SBarry Smith } 20189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20199566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202217ab2063SBarry Smith } 202317ab2063SBarry Smith 2024ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2025d71ae5a4SJacob Faibussowitsch { 2026416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20274e220ebcSLois Curfman McInnes 20283a40ed3dSBarry Smith PetscFunctionBegin; 20294e220ebcSLois Curfman McInnes info->block_size = 1.0; 20303966268fSBarry Smith info->nz_allocated = a->maxnz; 20313966268fSBarry Smith info->nz_used = a->nz; 20323966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20333966268fSBarry Smith info->assemblies = A->num_ass; 20343966268fSBarry Smith info->mallocs = A->info.mallocs; 20354dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2036d5f3da31SBarry Smith if (A->factortype) { 20374e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20384e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20394e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 20404e220ebcSLois Curfman McInnes } else { 20414e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 20424e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 20434e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 20444e220ebcSLois Curfman McInnes } 20453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 204617ab2063SBarry Smith } 204717ab2063SBarry Smith 2048421480d9SBarry Smith static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diagv, Vec x, Vec b) 2049d71ae5a4SJacob Faibussowitsch { 2050416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2051c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 205297b48c8fSBarry Smith const PetscScalar *xx; 20532e5835c6SStefano Zampini PetscScalar *bb, *aa; 2054c7da8527SEric Chamberland PetscInt d = 0; 2055421480d9SBarry Smith const PetscInt *diag; 205617ab2063SBarry Smith 20573a40ed3dSBarry Smith PetscFunctionBegin; 205897b48c8fSBarry Smith if (x && b) { 20599566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 20609566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 206197b48c8fSBarry Smith for (i = 0; i < N; i++) { 2062aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2063447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2064421480d9SBarry Smith bb[rows[i]] = diagv * xx[rows[i]]; 206597b48c8fSBarry Smith } 20669566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 20679566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 206897b48c8fSBarry Smith } 206997b48c8fSBarry Smith 2070421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL)); 20719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2072a9817697SBarry Smith if (a->keepnonzeropattern) { 2073f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2074aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 20759566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2076f1e2ffcdSBarry Smith } 2077421480d9SBarry Smith if (diagv != 0.0) { 2078c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2079c7da8527SEric Chamberland d = rows[i]; 2080421480d9SBarry Smith if (d >= A->cmap->n) continue; 2081421480d9SBarry Smith PetscCheck(diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 20829234b629SBarry Smith aa[diag[d]] = diagv; 2083f1e2ffcdSBarry Smith } 2084f1e2ffcdSBarry Smith } 2085f1e2ffcdSBarry Smith } else { 2086421480d9SBarry Smith if (diagv != 0.0) { 208717ab2063SBarry Smith for (i = 0; i < N; i++) { 2088aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 20897ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2090447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2091447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2092447d62f5SStefano Zampini } else { 2093416022c9SBarry Smith a->ilen[rows[i]] = 1; 2094421480d9SBarry Smith aa[a->i[rows[i]]] = diagv; 2095bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2096447d62f5SStefano Zampini } 2097447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 2098421480d9SBarry Smith PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diagv, INSERT_VALUES)); 209917ab2063SBarry Smith } 210017ab2063SBarry Smith } 21013a40ed3dSBarry Smith } else { 210217ab2063SBarry Smith for (i = 0; i < N; i++) { 2103aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2104416022c9SBarry Smith a->ilen[rows[i]] = 0; 210517ab2063SBarry Smith } 210617ab2063SBarry Smith } 2107e56f5c9eSBarry Smith A->nonzerostate++; 2108f1e2ffcdSBarry Smith } 21099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2110dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 211217ab2063SBarry Smith } 211317ab2063SBarry Smith 2114421480d9SBarry Smith static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diagv, Vec x, Vec b) 2115d71ae5a4SJacob Faibussowitsch { 21166e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21176e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 2118421480d9SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 21196e169961SBarry Smith const PetscScalar *xx; 21202e5835c6SStefano Zampini PetscScalar *bb, *aa; 2121421480d9SBarry Smith const PetscInt *diag; 2122421480d9SBarry Smith PetscBool diagDense; 21236e169961SBarry Smith 21246e169961SBarry Smith PetscFunctionBegin; 21253ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 2126421480d9SBarry Smith PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense)); 21279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21286e169961SBarry Smith if (x && b) { 21299566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21309566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21312b40b63fSBarry Smith vecs = PETSC_TRUE; 21326e169961SBarry Smith } 21339566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21346e169961SBarry Smith for (i = 0; i < N; i++) { 2135aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21368e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 21372205254eSKarl Rupp 21386e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21396e169961SBarry Smith } 21406e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 21416e169961SBarry Smith if (!zeroed[i]) { 21426e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 21434cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 21442e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 21452e5835c6SStefano Zampini aa[j] = 0.0; 21466e169961SBarry Smith } 21476e169961SBarry Smith } 2148421480d9SBarry Smith } else if (vecs && i < A->cmap->N) bb[i] = diagv * xx[i]; 21496e169961SBarry Smith } 21506e169961SBarry Smith if (x && b) { 21519566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21529566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 21536e169961SBarry Smith } 21549566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 2155421480d9SBarry Smith if (diagv != 0.0) { 2156421480d9SBarry Smith if (!diagDense) { 21571d5a398dSstefano_zampini for (i = 0; i < N; i++) { 21584cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2159aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 2160421480d9SBarry Smith PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diagv, INSERT_VALUES)); 21611d5a398dSstefano_zampini } 21621d5a398dSstefano_zampini } else { 2163421480d9SBarry Smith for (i = 0; i < N; i++) aa[diag[rows[i]]] = diagv; 21646e169961SBarry Smith } 21651d5a398dSstefano_zampini } 21669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 21679234b629SBarry Smith if (!diagDense) PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21696e169961SBarry Smith } 21706e169961SBarry Smith 2171d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2172d71ae5a4SJacob Faibussowitsch { 2173fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2174fff043a9SJunchao Zhang const PetscScalar *aa; 217517ab2063SBarry Smith 21763a40ed3dSBarry Smith PetscFunctionBegin; 21779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2178416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 21798e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 218017ab2063SBarry Smith if (idx) { 21815c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2182f4259b30SLisandro Dalcin else *idx = NULL; 218317ab2063SBarry Smith } 21849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 21853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218617ab2063SBarry Smith } 218717ab2063SBarry Smith 2188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2189d71ae5a4SJacob Faibussowitsch { 21903a40ed3dSBarry Smith PetscFunctionBegin; 21913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219217ab2063SBarry Smith } 219317ab2063SBarry Smith 2194ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2195d71ae5a4SJacob Faibussowitsch { 2196416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21972e5835c6SStefano Zampini const MatScalar *v; 219836db0b34SBarry Smith PetscReal sum = 0.0; 219997f1f81fSBarry Smith PetscInt i, j; 220017ab2063SBarry Smith 22013a40ed3dSBarry Smith PetscFunctionBegin; 22029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 220317ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2204570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2205570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2206792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2207570b7f6dSBarry Smith #else 2208416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22099371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22109371c9d4SSatish Balay v++; 221117ab2063SBarry Smith } 22128f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2213570b7f6dSBarry Smith #endif 22149566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 22153a40ed3dSBarry Smith } else if (type == NORM_1) { 221636db0b34SBarry Smith PetscReal *tmp; 221797f1f81fSBarry Smith PetscInt *jj = a->j; 22189566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2219064f8208SBarry Smith *nrm = 0.0; 2220416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22219371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22229371c9d4SSatish Balay v++; 222317ab2063SBarry Smith } 2224d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2225064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 222617ab2063SBarry Smith } 22279566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22293a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2230064f8208SBarry Smith *nrm = 0.0; 2231d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22328e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 223317ab2063SBarry Smith sum = 0.0; 2234416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 22359371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 22369371c9d4SSatish Balay v2++; 223717ab2063SBarry Smith } 2238064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 223917ab2063SBarry Smith } 22409566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2241f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 22429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 22433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 224417ab2063SBarry Smith } 224517ab2063SBarry Smith 2246ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2247d71ae5a4SJacob Faibussowitsch { 22483d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 224954f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 22502e5835c6SStefano Zampini const MatScalar *va, *vb; 225197f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2252cd0d46ebSvictorle 2253cd0d46ebSvictorle PetscFunctionBegin; 22549566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 22559566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 22565485867bSBarry Smith if (ma != nb || na != mb) { 22575485867bSBarry Smith *f = PETSC_FALSE; 22583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22595485867bSBarry Smith } 22609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 22619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 22629371c9d4SSatish Balay aii = aij->i; 22639371c9d4SSatish Balay bii = bij->i; 22649371c9d4SSatish Balay adx = aij->j; 22659371c9d4SSatish Balay bdx = bij->j; 22669566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 22679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2268cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2269cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2270cd0d46ebSvictorle 2271cd0d46ebSvictorle *f = PETSC_TRUE; 2272cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2273cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 227497f1f81fSBarry Smith PetscInt idc, idr; 22755485867bSBarry Smith PetscScalar vc, vr; 2276cd0d46ebSvictorle /* column/row index/value */ 22775485867bSBarry Smith idc = adx[aptr[i]]; 22785485867bSBarry Smith idr = bdx[bptr[idc]]; 22795485867bSBarry Smith vc = va[aptr[i]]; 22805485867bSBarry Smith vr = vb[bptr[idc]]; 22815485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 22825485867bSBarry Smith *f = PETSC_FALSE; 22835485867bSBarry Smith goto done; 2284cd0d46ebSvictorle } else { 22855485867bSBarry Smith aptr[i]++; 22865485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2287cd0d46ebSvictorle } 2288cd0d46ebSvictorle } 2289cd0d46ebSvictorle } 2290cd0d46ebSvictorle done: 22919566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 22929566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 22939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 22949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 22953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2296cd0d46ebSvictorle } 2297cd0d46ebSvictorle 2298ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2299d71ae5a4SJacob Faibussowitsch { 23003d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 230154f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 230254f21887SBarry Smith MatScalar *va, *vb; 23031cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23041cbb95d3SBarry Smith 23051cbb95d3SBarry Smith PetscFunctionBegin; 23069566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23079566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23081cbb95d3SBarry Smith if (ma != nb || na != mb) { 23091cbb95d3SBarry Smith *f = PETSC_FALSE; 23103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23111cbb95d3SBarry Smith } 23129371c9d4SSatish Balay aii = aij->i; 23139371c9d4SSatish Balay bii = bij->i; 23149371c9d4SSatish Balay adx = aij->j; 23159371c9d4SSatish Balay bdx = bij->j; 23169371c9d4SSatish Balay va = aij->a; 23179371c9d4SSatish Balay vb = bij->a; 23189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23201cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23211cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23221cbb95d3SBarry Smith 23231cbb95d3SBarry Smith *f = PETSC_TRUE; 23241cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23251cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23261cbb95d3SBarry Smith PetscInt idc, idr; 23271cbb95d3SBarry Smith PetscScalar vc, vr; 23281cbb95d3SBarry Smith /* column/row index/value */ 23291cbb95d3SBarry Smith idc = adx[aptr[i]]; 23301cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 23311cbb95d3SBarry Smith vc = va[aptr[i]]; 23321cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23331cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 23341cbb95d3SBarry Smith *f = PETSC_FALSE; 23351cbb95d3SBarry Smith goto done; 23361cbb95d3SBarry Smith } else { 23371cbb95d3SBarry Smith aptr[i]++; 23381cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 23391cbb95d3SBarry Smith } 23401cbb95d3SBarry Smith } 23411cbb95d3SBarry Smith } 23421cbb95d3SBarry Smith done: 23439566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23449566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23461cbb95d3SBarry Smith } 23471cbb95d3SBarry Smith 2348d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2349d71ae5a4SJacob Faibussowitsch { 2350416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2351fff8e43fSBarry Smith const PetscScalar *l, *r; 2352fff8e43fSBarry Smith PetscScalar x; 235354f21887SBarry Smith MatScalar *v; 2354fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2355fff8e43fSBarry Smith const PetscInt *jj; 235617ab2063SBarry Smith 23573a40ed3dSBarry Smith PetscFunctionBegin; 235817ab2063SBarry Smith if (ll) { 23593ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 23603ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 23619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 236208401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 23639566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 23649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 236517ab2063SBarry Smith for (i = 0; i < m; i++) { 236617ab2063SBarry Smith x = l[i]; 2367416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 23682205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 236917ab2063SBarry Smith } 23709566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 23719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 23729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 237317ab2063SBarry Smith } 237417ab2063SBarry Smith if (rr) { 23759566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 237608401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 23779566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 23789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 23792e5835c6SStefano Zampini jj = a->j; 23802205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 23819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 23829566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 23839566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 238417ab2063SBarry Smith } 23853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 238617ab2063SBarry Smith } 238717ab2063SBarry Smith 2388d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2389d71ae5a4SJacob Faibussowitsch { 2390db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2391d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 239297f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 23935d0c19d7SBarry Smith const PetscInt *irow, *icol; 23942e5835c6SStefano Zampini const PetscScalar *aa; 23955d0c19d7SBarry Smith PetscInt nrows, ncols; 239697f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2397fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2398416022c9SBarry Smith Mat C; 2399cdc6f3adSToby Isaac PetscBool stride; 240017ab2063SBarry Smith 24013a40ed3dSBarry Smith PetscFunctionBegin; 24029566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24039566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24049566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 240517ab2063SBarry Smith 24069566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2407ff718158SBarry Smith if (stride) { 24089566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2409ff718158SBarry Smith } else { 2410ff718158SBarry Smith first = 0; 2411ff718158SBarry Smith step = 0; 2412ff718158SBarry Smith } 2413fee21e36SBarry Smith if (stride && step == 1) { 241402834360SBarry Smith /* special case of contiguous rows */ 24159566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 241602834360SBarry Smith /* loop over new rows determining lens and starting points */ 241702834360SBarry Smith for (i = 0; i < nrows; i++) { 2418bfeeae90SHong Zhang kstart = ai[irow[i]]; 2419a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2420a91a9bebSLisandro Dalcin starts[i] = kstart; 242102834360SBarry Smith for (k = kstart; k < kend; k++) { 2422bfeeae90SHong Zhang if (aj[k] >= first) { 242302834360SBarry Smith starts[i] = k; 242402834360SBarry Smith break; 242502834360SBarry Smith } 242602834360SBarry Smith } 2427a2744918SBarry Smith sum = 0; 242802834360SBarry Smith while (k < kend) { 2429bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2430a2744918SBarry Smith sum++; 243102834360SBarry Smith } 2432a2744918SBarry Smith lens[i] = sum; 243302834360SBarry Smith } 243402834360SBarry Smith /* create submatrix */ 2435cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 243697f1f81fSBarry Smith PetscInt n_cols, n_rows; 24379566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2438aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 24399566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 244008480c60SBarry Smith C = *B; 24413a40ed3dSBarry Smith } else { 24423bef6203SJed Brown PetscInt rbs, cbs; 24439566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 24449566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 24459566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 24469566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 24479566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 24489566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 24499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 245008480c60SBarry Smith } 2451db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2452db02288aSLois Curfman McInnes 245302834360SBarry Smith /* loop over rows inserting into submatrix */ 2454fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2455db02288aSLois Curfman McInnes j_new = c->j; 2456db02288aSLois Curfman McInnes i_new = c->i; 24579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 245802834360SBarry Smith for (i = 0; i < nrows; i++) { 2459a2744918SBarry Smith ii = starts[i]; 2460a2744918SBarry Smith lensi = lens[i]; 2461810441c8SPierre Jolivet if (lensi) { 2462ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 24639566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2464a2744918SBarry Smith a_new += lensi; 2465810441c8SPierre Jolivet } 2466a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2467a2744918SBarry Smith c->ilen[i] = lensi; 246802834360SBarry Smith } 2469fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 24709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 24719566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 24723a40ed3dSBarry Smith } else { 24739566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 24749566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 24759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 24764dcab191SBarry Smith for (i = 0; i < ncols; i++) { 24776bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 24784dcab191SBarry Smith smap[icol[i]] = i + 1; 24794dcab191SBarry Smith } 24804dcab191SBarry Smith 248102834360SBarry Smith /* determine lens of each row */ 248202834360SBarry Smith for (i = 0; i < nrows; i++) { 2483bfeeae90SHong Zhang kstart = ai[irow[i]]; 248402834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 248502834360SBarry Smith lens[i] = 0; 248602834360SBarry Smith for (k = kstart; k < kend; k++) { 2487ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 248802834360SBarry Smith } 248902834360SBarry Smith } 249017ab2063SBarry Smith /* Create and fill new matrix */ 2491a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2492ace3abfcSBarry Smith PetscBool equal; 24930f5bd95cSBarry Smith 249499141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2495aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 24969566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2497fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros"); 24989566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 249908480c60SBarry Smith C = *B; 25003a40ed3dSBarry Smith } else { 25013bef6203SJed Brown PetscInt rbs, cbs; 25029566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25039566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25049566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25059566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 250637a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25079566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 250908480c60SBarry Smith } 25109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2511fb3c7e2dSJunchao Zhang 2512f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2513fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 251417ab2063SBarry Smith for (i = 0; i < nrows; i++) { 251599141d43SSatish Balay row = irow[i]; 2516bfeeae90SHong Zhang kstart = ai[row]; 251799141d43SSatish Balay kend = kstart + a->ilen[row]; 2518bfeeae90SHong Zhang mat_i = c->i[i]; 25198e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25208e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 252199141d43SSatish Balay mat_ilen = c->ilen + i; 252217ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2523bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2524ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25252e5835c6SStefano Zampini *mat_a++ = aa[k]; 252699141d43SSatish Balay (*mat_ilen)++; 252717ab2063SBarry Smith } 252817ab2063SBarry Smith } 252917ab2063SBarry Smith } 25309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 253102834360SBarry Smith /* Free work space */ 25329566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 25339566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 25349566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2535cdc6f3adSToby Isaac /* sort */ 2536cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2537cdc6f3adSToby Isaac PetscInt ilen; 2538cdc6f3adSToby Isaac 2539cdc6f3adSToby Isaac mat_i = c->i[i]; 25408e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25418e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2542cdc6f3adSToby Isaac ilen = c->ilen[i]; 25439566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2544cdc6f3adSToby Isaac } 2545fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 254602834360SBarry Smith } 25478c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 25489566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2549305c6ccfSStefano Zampini #endif 25509566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 25519566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 255217ab2063SBarry Smith 25539566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2554416022c9SBarry Smith *B = C; 25553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 255617ab2063SBarry Smith } 255717ab2063SBarry Smith 2558ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2559d71ae5a4SJacob Faibussowitsch { 256082d44351SHong Zhang Mat B; 256182d44351SHong Zhang 256282d44351SHong Zhang PetscFunctionBegin; 2563c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 25649566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 25659566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 25669566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 25679566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 25689566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 256982d44351SHong Zhang *subMat = B; 2570c2d650bdSHong Zhang } else { 25719566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2572c2d650bdSHong Zhang } 25733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 257482d44351SHong Zhang } 257582d44351SHong Zhang 2576ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2577d71ae5a4SJacob Faibussowitsch { 257863b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 257963b91edcSBarry Smith Mat outA; 2580ace3abfcSBarry Smith PetscBool row_identity, col_identity; 258163b91edcSBarry Smith 25823a40ed3dSBarry Smith PetscFunctionBegin; 258308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 25841df811f5SHong Zhang 25859566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 25869566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2587a871dcd8SBarry Smith 258863b91edcSBarry Smith outA = inA; 25899566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 25909566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 25912205254eSKarl Rupp 25929566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 25939566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 25942205254eSKarl Rupp 2595c3122656SLisandro Dalcin a->row = row; 25962205254eSKarl Rupp 25979566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 25989566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 25992205254eSKarl Rupp 2600c3122656SLisandro Dalcin a->col = col; 260163b91edcSBarry Smith 260236db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26039566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26049566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2605f0ec6fceSSatish Balay 260694a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 260784648c2dSPierre Jolivet PetscCall(PetscMalloc1(inA->rmap->n, &a->solve_work)); 260894a9d846SBarry Smith } 260963b91edcSBarry Smith 2610137fb511SHong Zhang if (row_identity && col_identity) { 26119566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2612137fb511SHong Zhang } else { 26139566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2614137fb511SHong Zhang } 2615421480d9SBarry Smith outA->factortype = MAT_FACTOR_LU; 26163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2617a871dcd8SBarry Smith } 2618a871dcd8SBarry Smith 2619d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2620d71ae5a4SJacob Faibussowitsch { 2621f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2622dfa0f9e5SStefano Zampini PetscScalar *v; 2623c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26243a40ed3dSBarry Smith 26253a40ed3dSBarry Smith PetscFunctionBegin; 26269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 26279566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2628792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 26299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 26309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 26313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2632f0b747eeSBarry Smith } 2633f0b747eeSBarry Smith 2634d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2635d71ae5a4SJacob Faibussowitsch { 263616b64355SHong Zhang PetscInt i; 263716b64355SHong Zhang 263816b64355SHong Zhang PetscFunctionBegin; 263916b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 26409566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 264116b64355SHong Zhang 264248a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 26439566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 264416b64355SHong Zhang 264516b64355SHong Zhang if (submatj->rbuf1) { 26469566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 26479566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 264816b64355SHong Zhang } 264916b64355SHong Zhang 265048a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 26519566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 26529566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 265316b64355SHong Zhang } 265416b64355SHong Zhang 265516b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2656eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 26579566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 26589566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 265916b64355SHong Zhang #else 26609566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 266116b64355SHong Zhang #endif 266216b64355SHong Zhang 266316b64355SHong Zhang if (!submatj->allcolumns) { 266416b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2665835f2295SStefano Zampini PetscCall(PetscHMapIDestroy(&submatj->cmap)); 266616b64355SHong Zhang #else 26679566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 266816b64355SHong Zhang #endif 266916b64355SHong Zhang } 26709566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 267116b64355SHong Zhang 26729566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 26733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 267416b64355SHong Zhang } 267516b64355SHong Zhang 2676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2677d71ae5a4SJacob Faibussowitsch { 267816b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 26795c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 268016b64355SHong Zhang 268116b64355SHong Zhang PetscFunctionBegin; 26829566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 26839566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 26843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 268516b64355SHong Zhang } 268616b64355SHong Zhang 268789a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2688ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2689d71ae5a4SJacob Faibussowitsch { 26902d033e1fSHong Zhang PetscInt i; 26910fb991dcSHong Zhang Mat C; 26920fb991dcSHong Zhang Mat_SeqAIJ *c; 26930fb991dcSHong Zhang Mat_SubSppt *submatj; 26942d033e1fSHong Zhang 26952d033e1fSHong Zhang PetscFunctionBegin; 26962d033e1fSHong Zhang for (i = 0; i < n; i++) { 26970fb991dcSHong Zhang C = (*mat)[i]; 26980fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 26990fb991dcSHong Zhang submatj = c->submatis1; 27002d033e1fSHong Zhang if (submatj) { 2701682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 270226cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27039566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27049566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27059566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27063faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27079566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27089566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27099566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2710682e4c99SStefano Zampini } 27112d033e1fSHong Zhang } else { 27129566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27132d033e1fSHong Zhang } 27142d033e1fSHong Zhang } 271586e85357SHong Zhang 271663a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27179566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 271863a75b2aSHong Zhang 27199566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27212d033e1fSHong Zhang } 27222d033e1fSHong Zhang 2723ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2724d71ae5a4SJacob Faibussowitsch { 272597f1f81fSBarry Smith PetscInt i; 2726cddf8d76SBarry Smith 27273a40ed3dSBarry Smith PetscFunctionBegin; 272848a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2729cddf8d76SBarry Smith 273048a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 27313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2732cddf8d76SBarry Smith } 2733cddf8d76SBarry Smith 2734ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2735d71ae5a4SJacob Faibussowitsch { 2736e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 27379a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 27385d0c19d7SBarry Smith const PetscInt *idx; 273958b7e2c1SStefano Zampini PetscInt start, end, *ai, *aj, bs = A->rmap->bs == A->cmap->bs ? A->rmap->bs : 1; 2740f1af5d2fSBarry Smith PetscBT table; 2741bbd702dbSSatish Balay 27423a40ed3dSBarry Smith PetscFunctionBegin; 27439a88ca10SBarry Smith m = A->rmap->n / bs; 2744e4d965acSSatish Balay ai = a->i; 2745bfeeae90SHong Zhang aj = a->j; 27468a047759SSatish Balay 274708401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 274806763907SSatish Balay 27499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 27509566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 275106763907SSatish Balay 2752e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2753b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2754e4d965acSSatish Balay isz = 0; 27559566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2756e4d965acSSatish Balay 2757e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 27589566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 27599566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2760e4d965acSSatish Balay 27619a88ca10SBarry Smith if (bs > 1) { 27629a88ca10SBarry Smith /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 27639a88ca10SBarry Smith for (j = 0; j < n; ++j) { 27649a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 27659a88ca10SBarry Smith } 27669a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 27679a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 27689a88ca10SBarry Smith 27699a88ca10SBarry Smith k = 0; 27709a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 27719a88ca10SBarry Smith n = isz; 27729a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 27739a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 27749a88ca10SBarry Smith row = bs * nidx[k] + ll; 27759a88ca10SBarry Smith start = ai[row]; 27769a88ca10SBarry Smith end = ai[row + 1]; 27779a88ca10SBarry Smith for (l = start; l < end; l++) { 27789a88ca10SBarry Smith val = aj[l] / bs; 27799a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 27809a88ca10SBarry Smith } 27819a88ca10SBarry Smith } 27829a88ca10SBarry Smith } 27839a88ca10SBarry Smith } 278457508eceSPierre Jolivet PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i)); 27859a88ca10SBarry Smith } else { 2786dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2787e4d965acSSatish Balay for (j = 0; j < n; ++j) { 27882205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 27894dcbc457SBarry Smith } 27909566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 27919566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2792e4d965acSSatish Balay 279304a348a9SBarry Smith k = 0; 279404a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 279504a348a9SBarry Smith n = isz; 279606763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2797e4d965acSSatish Balay row = nidx[k]; 2798e4d965acSSatish Balay start = ai[row]; 2799e4d965acSSatish Balay end = ai[row + 1]; 280004a348a9SBarry Smith for (l = start; l < end; l++) { 2801efb16452SHong Zhang val = aj[l]; 28022205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2803e4d965acSSatish Balay } 2804e4d965acSSatish Balay } 2805e4d965acSSatish Balay } 280657508eceSPierre Jolivet PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i)); 2807e4d965acSSatish Balay } 28089a88ca10SBarry Smith } 28099566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28109566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28124dcbc457SBarry Smith } 281317ab2063SBarry Smith 2814ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2815d71ae5a4SJacob Faibussowitsch { 28160513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28173b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28185d0c19d7SBarry Smith const PetscInt *row, *col; 28195d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 282056cd22aeSBarry Smith IS icolp, irowp; 28210298fd71SBarry Smith PetscInt *cwork = NULL; 28220298fd71SBarry Smith PetscScalar *vwork = NULL; 28230513a670SBarry Smith 28243a40ed3dSBarry Smith PetscFunctionBegin; 28259566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 28269566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 28279566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 28289566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 28290513a670SBarry Smith 28300513a670SBarry Smith /* determine lengths of permuted rows */ 28319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 28322205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 28339566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 28349566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 28359566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 28369566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 28379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 28389566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 28390513a670SBarry Smith 28409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 28410513a670SBarry Smith for (i = 0; i < m; i++) { 28429566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28432205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 28449566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 28459566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28460513a670SBarry Smith } 28479566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 28482205254eSKarl Rupp 28493c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 28502205254eSKarl Rupp 28518c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 28529566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 28539fe5e383SStefano Zampini #endif 28549566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 28559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 28569566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 28579566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 28589566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 28599566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 286048a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 28613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28620513a670SBarry Smith } 28630513a670SBarry Smith 2864d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2865d71ae5a4SJacob Faibussowitsch { 2866cb5b572fSBarry Smith PetscFunctionBegin; 286733f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 286833f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2869be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2870be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 28712e5835c6SStefano Zampini const PetscScalar *aa; 28723ac85a22SJunchao Zhang PetscScalar *bb; 2873be6bf707SBarry Smith 28749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 28753ac85a22SJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(B, &bb)); 28763ac85a22SJunchao Zhang 287708401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 28783ac85a22SJunchao Zhang PetscCall(PetscArraycpy(bb, aa, a->i[A->rmap->n])); 28799566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 28809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 28813ac85a22SJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(B, &bb)); 2882cb5b572fSBarry Smith } else { 28839566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2884cb5b572fSBarry Smith } 28853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2886cb5b572fSBarry Smith } 2887cb5b572fSBarry Smith 2888d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2889d71ae5a4SJacob Faibussowitsch { 28906c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28916e111a19SKarl Rupp 28926c0721eeSBarry Smith PetscFunctionBegin; 28936c0721eeSBarry Smith *array = a->a; 28943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28956c0721eeSBarry Smith } 28966c0721eeSBarry Smith 2897d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2898d71ae5a4SJacob Faibussowitsch { 28996c0721eeSBarry Smith PetscFunctionBegin; 2900f38c1e66SStefano Zampini *array = NULL; 29013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29026c0721eeSBarry Smith } 2903273d9f13SBarry Smith 29048229c054SShri Abhyankar /* 29058229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29068229c054SShri Abhyankar have different nonzero structure. 29078229c054SShri Abhyankar */ 2908d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2909d71ae5a4SJacob Faibussowitsch { 2910b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2911ec7775f6SShri Abhyankar 2912ec7775f6SShri Abhyankar PetscFunctionBegin; 2913ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2914ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29158e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2916b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2917b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29188af7cee1SJed Brown nnz[i] = 0; 29198af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2920b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2921b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29228af7cee1SJed Brown nnz[i]++; 29238af7cee1SJed Brown } 29248af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2925ec7775f6SShri Abhyankar } 29263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2927ec7775f6SShri Abhyankar } 2928ec7775f6SShri Abhyankar 2929d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 2930d71ae5a4SJacob Faibussowitsch { 2931b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2932b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 2933b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 2934b264fe52SHong Zhang 2935b264fe52SHong Zhang PetscFunctionBegin; 2936b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 29379566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 29383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2939b264fe52SHong Zhang } 2940b264fe52SHong Zhang 2941d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 2942d71ae5a4SJacob Faibussowitsch { 2943ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 2944ac90fabeSBarry Smith 2945ac90fabeSBarry Smith PetscFunctionBegin; 2946134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 2947134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 2948134adf20SPierre Jolivet if (e) { 29499566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 295081fa06acSBarry Smith if (e) { 29519566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 2952134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 295381fa06acSBarry Smith } 295481fa06acSBarry Smith } 295554c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 295681fa06acSBarry Smith } 2957ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 29582e5835c6SStefano Zampini const PetscScalar *xa; 29592e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 296081fa06acSBarry Smith PetscBLASInt one = 1, bnz; 296181fa06acSBarry Smith 29629566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 29639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 29649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 2965792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 29669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 29679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 29689566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 29699566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 2970ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 29719566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 2972ac90fabeSBarry Smith } else { 29738229c054SShri Abhyankar Mat B; 29748229c054SShri Abhyankar PetscInt *nnz; 29759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 29769566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 29779566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 29789566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 29799566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 29809566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 29819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 29829566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 29839566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 29849bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 29859566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 2986ac90fabeSBarry Smith } 29873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2988ac90fabeSBarry Smith } 2989ac90fabeSBarry Smith 2990d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 2991d71ae5a4SJacob Faibussowitsch { 2992354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 2993354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 2994354c94deSBarry Smith PetscInt i, nz; 2995354c94deSBarry Smith PetscScalar *a; 2996354c94deSBarry Smith 2997354c94deSBarry Smith PetscFunctionBegin; 2998354c94deSBarry Smith nz = aij->nz; 29999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30002205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3002354c94deSBarry Smith #else 3003354c94deSBarry Smith PetscFunctionBegin; 3004354c94deSBarry Smith #endif 30053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3006354c94deSBarry Smith } 3007354c94deSBarry Smith 3008ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3009d71ae5a4SJacob Faibussowitsch { 3010e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3011d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3012e34fafa9SBarry Smith PetscReal atmp; 3013985db425SBarry Smith PetscScalar *x; 3014ce496241SStefano Zampini const MatScalar *aa, *av; 3015e34fafa9SBarry Smith 3016e34fafa9SBarry Smith PetscFunctionBegin; 301728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3019ce496241SStefano Zampini aa = av; 3020e34fafa9SBarry Smith ai = a->i; 3021e34fafa9SBarry Smith aj = a->j; 3022e34fafa9SBarry Smith 30239566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30249566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 302508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3026e34fafa9SBarry Smith for (i = 0; i < m; i++) { 30279371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30289371c9d4SSatish Balay ai++; 302962e5df07SMark Adams x[i] = 0; 3030e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3031985db425SBarry Smith atmp = PetscAbsScalar(*aa); 30329371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 30339371c9d4SSatish Balay x[i] = atmp; 30349371c9d4SSatish Balay if (idx) idx[i] = *aj; 30359371c9d4SSatish Balay } 30369371c9d4SSatish Balay aa++; 30379371c9d4SSatish Balay aj++; 3038985db425SBarry Smith } 3039985db425SBarry Smith } 30409566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 30419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 30423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3043985db425SBarry Smith } 3044985db425SBarry Smith 3045eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3046eede4a3fSMark Adams { 3047eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3048eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3049eede4a3fSMark Adams PetscScalar *x; 3050eede4a3fSMark Adams const MatScalar *aa, *av; 3051eede4a3fSMark Adams 3052eede4a3fSMark Adams PetscFunctionBegin; 3053eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3054eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3055eede4a3fSMark Adams aa = av; 3056eede4a3fSMark Adams ai = a->i; 3057eede4a3fSMark Adams 3058eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3059eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3060eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3061eede4a3fSMark Adams for (i = 0; i < m; i++) { 3062eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3063eede4a3fSMark Adams ai++; 306462e5df07SMark Adams x[i] = 0; 3065eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3066eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3067eede4a3fSMark Adams aa++; 3068eede4a3fSMark Adams } 3069eede4a3fSMark Adams } 3070eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3071eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3072eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3073eede4a3fSMark Adams } 3074eede4a3fSMark Adams 3075ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3076d71ae5a4SJacob Faibussowitsch { 3077985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3078d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3079985db425SBarry Smith PetscScalar *x; 3080ce496241SStefano Zampini const MatScalar *aa, *av; 3081985db425SBarry Smith 3082985db425SBarry Smith PetscFunctionBegin; 308328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3085ce496241SStefano Zampini aa = av; 3086985db425SBarry Smith ai = a->i; 3087985db425SBarry Smith aj = a->j; 3088985db425SBarry Smith 30899566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30909566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 309108401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3092985db425SBarry Smith for (i = 0; i < m; i++) { 30939371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30949371c9d4SSatish Balay ai++; 3095d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 30969371c9d4SSatish Balay x[i] = *aa; 30979371c9d4SSatish Balay if (idx) idx[i] = 0; 3098985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3099985db425SBarry Smith x[i] = 0.0; 3100985db425SBarry Smith if (idx) { 3101985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3102985db425SBarry Smith if (aj[j] > j) { 3103985db425SBarry Smith idx[i] = j; 3104985db425SBarry Smith break; 3105985db425SBarry Smith } 3106985db425SBarry Smith } 31071a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31081a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3109985db425SBarry Smith } 3110985db425SBarry Smith } 3111985db425SBarry Smith for (j = 0; j < ncols; j++) { 31129371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31139371c9d4SSatish Balay x[i] = *aa; 31149371c9d4SSatish Balay if (idx) idx[i] = *aj; 31159371c9d4SSatish Balay } 31169371c9d4SSatish Balay aa++; 31179371c9d4SSatish Balay aj++; 3118985db425SBarry Smith } 3119985db425SBarry Smith } 31209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3123985db425SBarry Smith } 3124985db425SBarry Smith 3125ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3126d71ae5a4SJacob Faibussowitsch { 3127c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3128c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3129ce496241SStefano Zampini PetscScalar *x; 3130ce496241SStefano Zampini const MatScalar *aa, *av; 3131c87e5d42SMatthew Knepley 3132c87e5d42SMatthew Knepley PetscFunctionBegin; 31339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3134ce496241SStefano Zampini aa = av; 3135c87e5d42SMatthew Knepley ai = a->i; 3136c87e5d42SMatthew Knepley aj = a->j; 3137c87e5d42SMatthew Knepley 31389566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31399566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 314008401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3141c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31429371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31439371c9d4SSatish Balay ai++; 3144f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 31459371c9d4SSatish Balay x[i] = *aa; 31469371c9d4SSatish Balay if (idx) idx[i] = 0; 3147f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3148f07e67edSHong Zhang x[i] = 0.0; 3149f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3150289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3151f07e67edSHong Zhang if (aj[j] > j) { 3152f07e67edSHong Zhang idx[i] = j; 31532205254eSKarl Rupp break; 31542205254eSKarl Rupp } 3155289a08f5SMatthew Knepley } 3156f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3157f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3158f07e67edSHong Zhang } 3159289a08f5SMatthew Knepley } 3160c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 31619371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 31629371c9d4SSatish Balay x[i] = *aa; 31639371c9d4SSatish Balay if (idx) idx[i] = *aj; 31649371c9d4SSatish Balay } 31659371c9d4SSatish Balay aa++; 31669371c9d4SSatish Balay aj++; 3167c87e5d42SMatthew Knepley } 3168c87e5d42SMatthew Knepley } 31699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3172c87e5d42SMatthew Knepley } 3173c87e5d42SMatthew Knepley 3174ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3175d71ae5a4SJacob Faibussowitsch { 3176985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3177d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3178d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3179985db425SBarry Smith PetscScalar *x; 3180ce496241SStefano Zampini const MatScalar *aa, *av; 3181985db425SBarry Smith 3182985db425SBarry Smith PetscFunctionBegin; 318328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3185ce496241SStefano Zampini aa = av; 3186985db425SBarry Smith ai = a->i; 3187985db425SBarry Smith aj = a->j; 3188985db425SBarry Smith 31899566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31909566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 319108401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3192985db425SBarry Smith for (i = 0; i < m; i++) { 31939371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31949371c9d4SSatish Balay ai++; 3195d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31969371c9d4SSatish Balay x[i] = *aa; 31979371c9d4SSatish Balay if (idx) idx[i] = 0; 3198985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3199985db425SBarry Smith x[i] = 0.0; 3200985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3201985db425SBarry Smith for (j = 0; j < ncols; j++) { 3202985db425SBarry Smith if (aj[j] > j) { 3203985db425SBarry Smith idx[i] = j; 3204985db425SBarry Smith break; 3205985db425SBarry Smith } 3206985db425SBarry Smith } 3207fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3208fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3209985db425SBarry Smith } 3210985db425SBarry Smith } 3211985db425SBarry Smith for (j = 0; j < ncols; j++) { 32129371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32139371c9d4SSatish Balay x[i] = *aa; 32149371c9d4SSatish Balay if (idx) idx[i] = *aj; 32159371c9d4SSatish Balay } 32169371c9d4SSatish Balay aa++; 32179371c9d4SSatish Balay aj++; 3218e34fafa9SBarry Smith } 3219e34fafa9SBarry Smith } 32209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3223e34fafa9SBarry Smith } 3224bbead8a2SBarry Smith 3225ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3226d71ae5a4SJacob Faibussowitsch { 3227bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 322858b7e2c1SStefano Zampini PetscInt i, bs = A->rmap->bs, mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3229bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32300da83c2eSBarry Smith const PetscReal shift = 0.0; 32311a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3232bbead8a2SBarry Smith 3233bbead8a2SBarry Smith PetscFunctionBegin; 3234a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32354a0d0026SBarry Smith if (a->ibdiagvalid) { 32364a0d0026SBarry Smith if (values) *values = a->ibdiag; 32373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 32384a0d0026SBarry Smith } 32393a7d0413SPierre Jolivet if (!a->ibdiag) PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); 3240bbead8a2SBarry Smith diag = a->ibdiag; 3241bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3242bbead8a2SBarry Smith /* factor and invert each block */ 3243bbead8a2SBarry Smith switch (bs) { 3244bbead8a2SBarry Smith case 1: 3245bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32469566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3247ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3248966bd95aSPierre Jolivet PetscCheck(allowzeropivot, PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 32497b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32507b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32517b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 3253ec1892c8SHong Zhang } 3254bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3255bbead8a2SBarry Smith } 3256bbead8a2SBarry Smith break; 3257bbead8a2SBarry Smith case 2: 3258bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32599371c9d4SSatish Balay ij[0] = 2 * i; 32609371c9d4SSatish Balay ij[1] = 2 * i + 1; 32619566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 32629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 32637b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3265bbead8a2SBarry Smith diag += 4; 3266bbead8a2SBarry Smith } 3267bbead8a2SBarry Smith break; 3268bbead8a2SBarry Smith case 3: 3269bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32709371c9d4SSatish Balay ij[0] = 3 * i; 32719371c9d4SSatish Balay ij[1] = 3 * i + 1; 32729371c9d4SSatish Balay ij[2] = 3 * i + 2; 32739566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 32749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 32757b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32769566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3277bbead8a2SBarry Smith diag += 9; 3278bbead8a2SBarry Smith } 3279bbead8a2SBarry Smith break; 3280bbead8a2SBarry Smith case 4: 3281bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32829371c9d4SSatish Balay ij[0] = 4 * i; 32839371c9d4SSatish Balay ij[1] = 4 * i + 1; 32849371c9d4SSatish Balay ij[2] = 4 * i + 2; 32859371c9d4SSatish Balay ij[3] = 4 * i + 3; 32869566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 32879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 32887b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32899566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3290bbead8a2SBarry Smith diag += 16; 3291bbead8a2SBarry Smith } 3292bbead8a2SBarry Smith break; 3293bbead8a2SBarry Smith case 5: 3294bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32959371c9d4SSatish Balay ij[0] = 5 * i; 32969371c9d4SSatish Balay ij[1] = 5 * i + 1; 32979371c9d4SSatish Balay ij[2] = 5 * i + 2; 32989371c9d4SSatish Balay ij[3] = 5 * i + 3; 32999371c9d4SSatish Balay ij[4] = 5 * i + 4; 33009566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33019566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33027b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33039566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3304bbead8a2SBarry Smith diag += 25; 3305bbead8a2SBarry Smith } 3306bbead8a2SBarry Smith break; 3307bbead8a2SBarry Smith case 6: 3308bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33099371c9d4SSatish Balay ij[0] = 6 * i; 33109371c9d4SSatish Balay ij[1] = 6 * i + 1; 33119371c9d4SSatish Balay ij[2] = 6 * i + 2; 33129371c9d4SSatish Balay ij[3] = 6 * i + 3; 33139371c9d4SSatish Balay ij[4] = 6 * i + 4; 33149371c9d4SSatish Balay ij[5] = 6 * i + 5; 33159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33177b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33189566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3319bbead8a2SBarry Smith diag += 36; 3320bbead8a2SBarry Smith } 3321bbead8a2SBarry Smith break; 3322bbead8a2SBarry Smith case 7: 3323bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33249371c9d4SSatish Balay ij[0] = 7 * i; 33259371c9d4SSatish Balay ij[1] = 7 * i + 1; 33269371c9d4SSatish Balay ij[2] = 7 * i + 2; 33279371c9d4SSatish Balay ij[3] = 7 * i + 3; 33289371c9d4SSatish Balay ij[4] = 7 * i + 4; 33299371c9d4SSatish Balay ij[5] = 7 * i + 5; 3330cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 33319566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33337b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3335bbead8a2SBarry Smith diag += 49; 3336bbead8a2SBarry Smith } 3337bbead8a2SBarry Smith break; 3338bbead8a2SBarry Smith default: 33399566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3340bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3341ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 33429566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 33439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 33447b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3346bbead8a2SBarry Smith diag += bs2; 3347bbead8a2SBarry Smith } 33489566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3349bbead8a2SBarry Smith } 3350bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 33513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3352bbead8a2SBarry Smith } 3353bbead8a2SBarry Smith 3354d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3355d71ae5a4SJacob Faibussowitsch { 335673a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3357fff043a9SJunchao Zhang PetscScalar a, *aa; 335873a71a0fSBarry Smith PetscInt m, n, i, j, col; 335973a71a0fSBarry Smith 336073a71a0fSBarry Smith PetscFunctionBegin; 336173a71a0fSBarry Smith if (!x->assembled) { 33629566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 336373a71a0fSBarry Smith for (i = 0; i < m; i++) { 336473a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 33659566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 336673a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 33679566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 336873a71a0fSBarry Smith } 336973a71a0fSBarry Smith } 3370e2ce353bSJunchao Zhang } else { 33719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 33729566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 33739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3374e2ce353bSJunchao Zhang } 33759566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 33769566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 33773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 337873a71a0fSBarry Smith } 337973a71a0fSBarry Smith 3380679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3381d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3382d71ae5a4SJacob Faibussowitsch { 3383679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3384679944adSJunchao Zhang PetscScalar a; 3385679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3386679944adSJunchao Zhang 3387679944adSJunchao Zhang PetscFunctionBegin; 3388679944adSJunchao Zhang nskip = high - low; 33899566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3390679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3391679944adSJunchao Zhang for (i = 0; i < m; i++) { 3392679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 33939566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3394679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3395679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 33969566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3397679944adSJunchao Zhang } 3398e2ce353bSJunchao Zhang } 33999566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34009566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3402679944adSJunchao Zhang } 3403679944adSJunchao Zhang 34040a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3405cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3406cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3407cb5b572fSBarry Smith MatMult_SeqAIJ, 340897304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34097c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34107c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3411f4259b30SLisandro Dalcin NULL, 3412f4259b30SLisandro Dalcin NULL, 3413f4259b30SLisandro Dalcin NULL, 3414f4259b30SLisandro Dalcin /* 10*/ NULL, 3415cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3416f4259b30SLisandro Dalcin NULL, 341741f059aeSBarry Smith MatSOR_SeqAIJ, 341891e9d3e2SHong Zhang MatTranspose_SeqAIJ, 341997304618SKris Buschelman /* 15*/ MatGetInfo_SeqAIJ, 3420cb5b572fSBarry Smith MatEqual_SeqAIJ, 3421cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3422cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3423cb5b572fSBarry Smith MatNorm_SeqAIJ, 3424f4259b30SLisandro Dalcin /* 20*/ NULL, 3425cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3426cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3427cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3428d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3429f4259b30SLisandro Dalcin NULL, 3430f4259b30SLisandro Dalcin NULL, 3431f4259b30SLisandro Dalcin NULL, 3432f4259b30SLisandro Dalcin NULL, 343326cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3434f4259b30SLisandro Dalcin NULL, 3435f4259b30SLisandro Dalcin NULL, 3436f4259b30SLisandro Dalcin NULL, 3437f4259b30SLisandro Dalcin NULL, 3438d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3439f4259b30SLisandro Dalcin NULL, 3440f4259b30SLisandro Dalcin NULL, 3441cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3442f4259b30SLisandro Dalcin NULL, 3443d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 34447dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3445cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3446cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3447cb5b572fSBarry Smith MatCopy_SeqAIJ, 3448d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3449cb5b572fSBarry Smith MatScale_SeqAIJ, 34507d68702bSBarry Smith MatShift_SeqAIJ, 345179299369SBarry Smith MatDiagonalSet_SeqAIJ, 34526e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 345373a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 34543b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 34553b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 34563b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3457a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 345893dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3459f4259b30SLisandro Dalcin NULL, 3460f4259b30SLisandro Dalcin NULL, 3461cda55fadSBarry Smith MatPermute_SeqAIJ, 3462f4259b30SLisandro Dalcin NULL, 3463f4259b30SLisandro Dalcin /* 59*/ NULL, 3464b9b97703SBarry Smith MatDestroy_SeqAIJ, 3465b9b97703SBarry Smith MatView_SeqAIJ, 3466f4259b30SLisandro Dalcin NULL, 3467f4259b30SLisandro Dalcin NULL, 34688bb0f5c6SPierre Jolivet /* 64*/ MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3469f4259b30SLisandro Dalcin NULL, 3470f4259b30SLisandro Dalcin NULL, 3471f4259b30SLisandro Dalcin NULL, 34728bb0f5c6SPierre Jolivet MatGetRowMaxAbs_SeqAIJ, 34738bb0f5c6SPierre Jolivet /* 69*/ MatGetRowMinAbs_SeqAIJ, 3474f4259b30SLisandro Dalcin NULL, 3475f4259b30SLisandro Dalcin NULL, 34763acb8795SBarry Smith MatFDColoringApply_AIJ, 3477f4259b30SLisandro Dalcin NULL, 34788bb0f5c6SPierre Jolivet /* 74*/ MatFindZeroDiagonals_SeqAIJ, 3479f4259b30SLisandro Dalcin NULL, 3480f4259b30SLisandro Dalcin NULL, 3481f4259b30SLisandro Dalcin NULL, 3482bc011b1eSHong Zhang MatLoad_SeqAIJ, 34838bb0f5c6SPierre Jolivet /* 79*/ NULL, 34848bb0f5c6SPierre Jolivet NULL, 34858bb0f5c6SPierre Jolivet NULL, 34868bb0f5c6SPierre Jolivet NULL, 34878bb0f5c6SPierre Jolivet NULL, 34886cff0a6bSPierre Jolivet /* 84*/ NULL, 348926be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 34908bb0f5c6SPierre Jolivet MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3491f4259b30SLisandro Dalcin NULL, 34926fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 34938bb0f5c6SPierre Jolivet /* 90*/ NULL, 34948bb0f5c6SPierre Jolivet MatProductSetFromOptions_SeqAIJ, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin NULL, 349787d4246cSBarry Smith MatConjugate_SeqAIJ, 34988bb0f5c6SPierre Jolivet /* 94*/ NULL, 34998bb0f5c6SPierre Jolivet MatSetValuesRow_SeqAIJ, 350099cafbc1SBarry Smith MatRealPart_SeqAIJ, 3501f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3502f4259b30SLisandro Dalcin NULL, 35038bb0f5c6SPierre Jolivet /* 99*/ NULL, 35048bb0f5c6SPierre Jolivet MatMatSolve_SeqAIJ, 3505f4259b30SLisandro Dalcin NULL, 35062af78befSBarry Smith MatGetRowMin_SeqAIJ, 3507f4259b30SLisandro Dalcin NULL, 3508421480d9SBarry Smith /*104*/ NULL, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 3511f4259b30SLisandro Dalcin NULL, 3512f4259b30SLisandro Dalcin NULL, 35138bb0f5c6SPierre Jolivet /*109*/ NULL, 3514f4259b30SLisandro Dalcin NULL, 3515f4259b30SLisandro Dalcin NULL, 3516f4259b30SLisandro Dalcin NULL, 3517421480d9SBarry Smith MatGetMultiProcBlock_SeqAIJ, 3518421480d9SBarry Smith /*114*/ MatFindNonzeroRows_SeqAIJ, 3519a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 352037868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35210da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3522f4259b30SLisandro Dalcin NULL, 3523421480d9SBarry Smith /*119*/ NULL, 3524f4259b30SLisandro Dalcin NULL, 352575648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3526b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3527421480d9SBarry Smith MatTransColoringApplySpToDen_SeqAIJ, 3528421480d9SBarry Smith /*124*/ MatTransColoringApplyDenToSp_SeqAIJ, 35293964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 35308bb0f5c6SPierre Jolivet NULL, 35318bb0f5c6SPierre Jolivet NULL, 3532421480d9SBarry Smith MatFDColoringSetUp_SeqXAIJ, 3533421480d9SBarry Smith /*129*/ MatFindOffBlockDiagonalEntries_SeqAIJ, 35348bb0f5c6SPierre Jolivet MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 35358bb0f5c6SPierre Jolivet MatDestroySubMatrices_SeqAIJ, 35368bb0f5c6SPierre Jolivet NULL, 3537421480d9SBarry Smith NULL, 3538421480d9SBarry Smith /*134*/ MatCreateGraph_Simple_AIJ, 35398bb0f5c6SPierre Jolivet MatTransposeSymbolic_SeqAIJ, 35408bb0f5c6SPierre Jolivet MatEliminateZeros_SeqAIJ, 35418bb0f5c6SPierre Jolivet MatGetRowSumAbs_SeqAIJ, 3542f4259b30SLisandro Dalcin NULL, 3543421480d9SBarry Smith /*139*/ NULL, 3544f4259b30SLisandro Dalcin NULL, 354503db1824SAlex Lindsay MatCopyHashToXAIJ_Seq_Hash, 3546c2be7ffeSStefano Zampini NULL, 354703db1824SAlex Lindsay NULL}; 354817ab2063SBarry Smith 3549ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3550d71ae5a4SJacob Faibussowitsch { 3551bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 355297f1f81fSBarry Smith PetscInt i, nz, n; 3553bef8e0ddSBarry Smith 3554bef8e0ddSBarry Smith PetscFunctionBegin; 3555bef8e0ddSBarry Smith nz = aij->maxnz; 3556d0f46423SBarry Smith n = mat->rmap->n; 3557ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3558bef8e0ddSBarry Smith aij->nz = nz; 3559ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 35603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3561bef8e0ddSBarry Smith } 3562bef8e0ddSBarry Smith 3563a3bb6f32SFande Kong /* 3564ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 3565ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3566ddea5d60SJunchao Zhang */ 3567d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3568d71ae5a4SJacob Faibussowitsch { 3569a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3570eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3571eec179cfSJacob Faibussowitsch PetscHashIter tpos; 357225b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 357325b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3574a3bb6f32SFande Kong 3575a3bb6f32SFande Kong PetscFunctionBegin; 3576a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 35774f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3578a3bb6f32SFande Kong /* use a table */ 3579eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3580a3bb6f32SFande Kong ec = 0; 358125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 358225b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3583eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3584a3bb6f32SFande Kong if (!data) { 3585a3bb6f32SFande Kong /* one based table */ 3586c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3587a3bb6f32SFande Kong } 3588a3bb6f32SFande Kong } 3589a3bb6f32SFande Kong /* form array of columns we need */ 35909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3591eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3592eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3593eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3594eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3595eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3596a3bb6f32SFande Kong gid--; 3597a3bb6f32SFande Kong lid--; 3598a3bb6f32SFande Kong garray[lid] = gid; 3599a3bb6f32SFande Kong } 36009566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3601eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3602c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3603a3bb6f32SFande Kong /* compact out the extra columns in B */ 360425b670f0SStefano Zampini for (i = 0; i < nz; i++) { 360525b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3606eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3607a3bb6f32SFande Kong lid--; 360825b670f0SStefano Zampini jj[i] = lid; 3609a3bb6f32SFande Kong } 36109566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3611eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36129566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36139566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36149566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3616a3bb6f32SFande Kong } 3617a3bb6f32SFande Kong 3618bef8e0ddSBarry Smith /*@ 3619bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3620bef8e0ddSBarry Smith in the matrix. 3621bef8e0ddSBarry Smith 3622bef8e0ddSBarry Smith Input Parameters: 362311a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3624bef8e0ddSBarry Smith - indices - the column indices 3625bef8e0ddSBarry Smith 362615091d37SBarry Smith Level: advanced 362715091d37SBarry Smith 3628bef8e0ddSBarry Smith Notes: 3629bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3630bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 363111a5261eSBarry Smith of the `MatSetValues()` operation. 3632bef8e0ddSBarry Smith 3633bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 363411a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3635bef8e0ddSBarry Smith 363611a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3637bef8e0ddSBarry Smith 3638b9617806SBarry Smith The indices should start with zero, not one. 3639b9617806SBarry Smith 36401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3641bef8e0ddSBarry Smith @*/ 3642d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3643d71ae5a4SJacob Faibussowitsch { 3644bef8e0ddSBarry Smith PetscFunctionBegin; 36450700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36464f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3647cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 36483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3649bef8e0ddSBarry Smith } 3650bef8e0ddSBarry Smith 3651ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3652d71ae5a4SJacob Faibussowitsch { 3653be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3654d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3655be6bf707SBarry Smith 3656be6bf707SBarry Smith PetscFunctionBegin; 365728b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3658be6bf707SBarry Smith 3659be6bf707SBarry Smith /* allocate space for values if not already there */ 36603a7d0413SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 3661be6bf707SBarry Smith 3662be6bf707SBarry Smith /* copy values over */ 36639566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 36643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3665be6bf707SBarry Smith } 3666be6bf707SBarry Smith 3667be6bf707SBarry Smith /*@ 366820f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3669be6bf707SBarry Smith nonlinear portion. 3670be6bf707SBarry Smith 3671c3339decSBarry Smith Logically Collect 3672be6bf707SBarry Smith 367327430b45SBarry Smith Input Parameter: 367411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3675be6bf707SBarry Smith 367615091d37SBarry Smith Level: advanced 367715091d37SBarry Smith 36782920cce0SJacob Faibussowitsch Example Usage: 367927430b45SBarry Smith .vb 36802ef1f0ffSBarry Smith Using SNES 368127430b45SBarry Smith Create Jacobian matrix 368227430b45SBarry Smith Set linear terms into matrix 368327430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 368427430b45SBarry Smith final nonzero structure (i.e. setting the nonlinear terms and applying 368527430b45SBarry Smith boundary conditions again will not change the nonzero structure 368627430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 368727430b45SBarry Smith MatStoreValues(mat); 368827430b45SBarry Smith Call SNESSetJacobian() with matrix 368927430b45SBarry Smith In your Jacobian routine 369027430b45SBarry Smith MatRetrieveValues(mat); 369127430b45SBarry Smith Set nonlinear terms in matrix 3692be6bf707SBarry Smith 369327430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 369427430b45SBarry Smith // build linear portion of Jacobian 369527430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 369627430b45SBarry Smith MatStoreValues(mat); 369727430b45SBarry Smith loop over nonlinear iterations 369827430b45SBarry Smith MatRetrieveValues(mat); 369927430b45SBarry Smith // call MatSetValues(mat,...) to set nonliner portion of Jacobian 370027430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 370127430b45SBarry Smith Solve linear system with Jacobian 370227430b45SBarry Smith endloop 370327430b45SBarry Smith .ve 3704be6bf707SBarry Smith 3705be6bf707SBarry Smith Notes: 3706da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 370711a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3708be6bf707SBarry Smith calling this routine. 3709be6bf707SBarry Smith 37100c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37110c468ba9SBarry Smith and does not allocated additional space. 37120c468ba9SBarry Smith 3713fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3714be6bf707SBarry Smith @*/ 3715d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3716d71ae5a4SJacob Faibussowitsch { 3717be6bf707SBarry Smith PetscFunctionBegin; 37180700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 371928b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 372028b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3721cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 37223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3723be6bf707SBarry Smith } 3724be6bf707SBarry Smith 3725ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3726d71ae5a4SJacob Faibussowitsch { 3727be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3728d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3729be6bf707SBarry Smith 3730be6bf707SBarry Smith PetscFunctionBegin; 373128b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 373228b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3733be6bf707SBarry Smith /* copy values over */ 37349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 37353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3736be6bf707SBarry Smith } 3737be6bf707SBarry Smith 3738be6bf707SBarry Smith /*@ 373920f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3740be6bf707SBarry Smith 3741c3339decSBarry Smith Logically Collect 3742be6bf707SBarry Smith 37432fe279fdSBarry Smith Input Parameter: 374411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3745be6bf707SBarry Smith 374615091d37SBarry Smith Level: advanced 374715091d37SBarry Smith 37481cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3749be6bf707SBarry Smith @*/ 3750d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3751d71ae5a4SJacob Faibussowitsch { 3752be6bf707SBarry Smith PetscFunctionBegin; 37530700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 375428b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 375528b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3756cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 37573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3758be6bf707SBarry Smith } 3759be6bf707SBarry Smith 37605d83a8b1SBarry Smith /*@ 376111a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 37620d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 376320f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 376420f4b53cSBarry Smith (or the array `nnz`). 376517ab2063SBarry Smith 3766d083f849SBarry Smith Collective 3767db81eaa0SLois Curfman McInnes 376817ab2063SBarry Smith Input Parameters: 376911a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 377017ab2063SBarry Smith . m - number of rows 377117ab2063SBarry Smith . n - number of columns 377217ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 377351c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 37740298fd71SBarry Smith (possibly different for each row) or NULL 377517ab2063SBarry Smith 377617ab2063SBarry Smith Output Parameter: 3777416022c9SBarry Smith . A - the matrix 377817ab2063SBarry Smith 37792ef1f0ffSBarry Smith Options Database Keys: 37802ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 37812ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 37822ef1f0ffSBarry Smith 37832ef1f0ffSBarry Smith Level: intermediate 3784175b88e8SBarry Smith 3785b259b22eSLois Curfman McInnes Notes: 378677433607SBarry Smith It is recommend to use `MatCreateFromOptions()` instead of this routine 378777433607SBarry Smith 37882ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 378949a6f317SBarry Smith 37902ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 37912ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 37920002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 37932ef1f0ffSBarry Smith either one (as in Fortran) or zero. 379417ab2063SBarry Smith 379520f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 37962ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 379720f4b53cSBarry Smith allocation. 379817ab2063SBarry Smith 3799682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38004fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3801682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38026c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38036c7ebb05SLois Curfman McInnes 38041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 380517ab2063SBarry Smith @*/ 3806d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3807d71ae5a4SJacob Faibussowitsch { 38083a40ed3dSBarry Smith PetscFunctionBegin; 38099566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38109566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38119566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 38133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3814273d9f13SBarry Smith } 3815273d9f13SBarry Smith 38165d83a8b1SBarry Smith /*@ 3817273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3818273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3819273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3820273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3821273d9f13SBarry Smith 3822d083f849SBarry Smith Collective 3823273d9f13SBarry Smith 3824273d9f13SBarry Smith Input Parameters: 38251c4f3114SJed Brown + B - The matrix 3826273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3827273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38280298fd71SBarry Smith (possibly different for each row) or NULL 3829273d9f13SBarry Smith 38302ef1f0ffSBarry Smith Options Database Keys: 38312ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38322ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38332ef1f0ffSBarry Smith 38342ef1f0ffSBarry Smith Level: intermediate 38352ef1f0ffSBarry Smith 3836273d9f13SBarry Smith Notes: 38372ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 383849a6f317SBarry Smith 383911a5261eSBarry Smith The `MATSEQAIJ` format also called 38402ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3841273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3842273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3843273d9f13SBarry Smith 38442ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 38452ef1f0ffSBarry Smith Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 38462ef1f0ffSBarry Smith allocation. 3847273d9f13SBarry Smith 384811a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3849aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3850aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3851aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3852aa95bbe8SBarry Smith 385311a5261eSBarry Smith Developer Notes: 385411a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3855a96a251dSBarry Smith entries or columns indices 3856a96a251dSBarry Smith 3857273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3858273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3859273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3860273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3861273d9f13SBarry Smith 38621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3863db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3864273d9f13SBarry Smith @*/ 3865d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3866d71ae5a4SJacob Faibussowitsch { 3867a23d5eceSKris Buschelman PetscFunctionBegin; 38686ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 38696ba663aaSJed Brown PetscValidType(B, 1); 3870cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 38713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3872a23d5eceSKris Buschelman } 3873a23d5eceSKris Buschelman 3874d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3875d71ae5a4SJacob Faibussowitsch { 3876ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 38772576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 387897f1f81fSBarry Smith PetscInt i; 3879273d9f13SBarry Smith 3880273d9f13SBarry Smith PetscFunctionBegin; 3881ad79cf63SBarry Smith if (B->hash_active) { 3882aea10558SJacob Faibussowitsch B->ops[0] = b->cops; 3883ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3884ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3885ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3886ad79cf63SBarry Smith } 38872576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3888a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3889c461c341SBarry Smith skipallocation = PETSC_TRUE; 3890c461c341SBarry Smith nz = 0; 3891c461c341SBarry Smith } 38929566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 38939566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3894899cda47SBarry Smith 3895435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 389608401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 38979f0612e4SBarry Smith if (nnz) { 3898d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 389908401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 390008401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3901b73539f3SBarry Smith } 3902b73539f3SBarry Smith } 3903b73539f3SBarry Smith 3904273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3905ab93d7beSBarry Smith if (!skipallocation) { 39063a7d0413SPierre Jolivet if (!b->imax) PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); 3907071fcb05SBarry Smith if (!b->ilen) { 3908071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. */ 39099566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3910071fcb05SBarry Smith } else { 39119566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39122ee49352SLisandro Dalcin } 3913aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3914273d9f13SBarry Smith if (!nnz) { 3915435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3916c62bd62aSJed Brown else if (nz < 0) nz = 1; 39175d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3918d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3919c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 3920273d9f13SBarry Smith } else { 3921c73702f5SBarry Smith PetscInt64 nz64 = 0; 39229371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39239371c9d4SSatish Balay b->imax[i] = nnz[i]; 39249371c9d4SSatish Balay nz64 += nnz[i]; 39259371c9d4SSatish Balay } 39269566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3927273d9f13SBarry Smith } 3928ab93d7beSBarry Smith 3929273d9f13SBarry Smith /* allocate the matrix space */ 39309566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 39319f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j)); 39329f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i)); 39339f0612e4SBarry Smith b->free_ij = PETSC_TRUE; 3934396832f4SHong Zhang if (B->structure_only) { 39359f0612e4SBarry Smith b->free_a = PETSC_FALSE; 3936396832f4SHong Zhang } else { 39379f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a)); 39389f0612e4SBarry Smith b->free_a = PETSC_TRUE; 3939396832f4SHong Zhang } 3940bfeeae90SHong Zhang b->i[0] = 0; 3941ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 3942c461c341SBarry Smith } else { 3943e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3944e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3945c461c341SBarry Smith } 3946273d9f13SBarry Smith 3947846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3948846b4da1SFande Kong /* reserve user-requested sparsity */ 39499566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 3950846b4da1SFande Kong } 3951846b4da1SFande Kong 3952273d9f13SBarry Smith b->nz = 0; 3953273d9f13SBarry Smith b->maxnz = nz; 3954273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 39551baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 3956cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 3957cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 39585519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 39595519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 39605519a089SJose E. Roman */ 39615519a089SJose E. Roman B->nonzerostate++; 39623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3963273d9f13SBarry Smith } 3964273d9f13SBarry Smith 39654c51d546SAlexander PetscErrorCode MatResetPreallocation_SeqAIJ_Private(Mat A, PetscBool *memoryreset) 3966d71ae5a4SJacob Faibussowitsch { 3967846b4da1SFande Kong Mat_SeqAIJ *a; 3968a5bbaf83SFande Kong PetscInt i; 39691f14be2bSBarry Smith PetscBool skipreset; 3970846b4da1SFande Kong 3971846b4da1SFande Kong PetscFunctionBegin; 3972846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 397314d0e64fSAlex Lindsay 39744c51d546SAlexander PetscCheck(A->insertmode == NOT_SET_VALUES, PETSC_COMM_SELF, PETSC_ERR_SUP, "Cannot reset preallocation after setting some values but not yet calling MatAssemblyBegin()/MatAssemblyEnd()"); 39754c51d546SAlexander if (A->num_ass == 0) PetscFunctionReturn(PETSC_SUCCESS); 39764c51d546SAlexander 397714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 39783ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 397914d0e64fSAlex Lindsay 3980846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 39812c814fdeSFande Kong /* if no saved info, we error out */ 398228b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 39832c814fdeSFande Kong 39841f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and cannot reset preallocation "); 39852c814fdeSFande Kong 39861f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 39874c51d546SAlexander if (skipreset) PetscCall(MatZeroEntries(A)); 39884c51d546SAlexander else { 39899566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 39909566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 3991846b4da1SFande Kong a->i[0] = 0; 3992ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 3993846b4da1SFande Kong A->preallocated = PETSC_TRUE; 3994846b4da1SFande Kong a->nz = 0; 3995846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 3996846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 3997846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 3998846b4da1SFande Kong A->assembled = PETSC_FALSE; 3999b3a35320SAlex Lindsay A->nonzerostate++; 4000b3a35320SAlex Lindsay /* Log that the state of this object has changed; this will help guarantee that preconditioners get re-setup */ 4001b3a35320SAlex Lindsay PetscCall(PetscObjectStateIncrease((PetscObject)A)); 40021f14be2bSBarry Smith } 40034c51d546SAlexander if (memoryreset) *memoryreset = (PetscBool)!skipreset; 40044c51d546SAlexander PetscFunctionReturn(PETSC_SUCCESS); 40054c51d546SAlexander } 40064c51d546SAlexander 40074c51d546SAlexander static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 40084c51d546SAlexander { 40094c51d546SAlexander PetscFunctionBegin; 40104c51d546SAlexander PetscCall(MatResetPreallocation_SeqAIJ_Private(A, NULL)); 40113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4012846b4da1SFande Kong } 4013846b4da1SFande Kong 401458d36128SBarry Smith /*@ 401511a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4016a1661176SMatthew Knepley 4017a1661176SMatthew Knepley Input Parameters: 4018a1661176SMatthew Knepley + B - the matrix 4019d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4020d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row 4021d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4022a1661176SMatthew Knepley 4023a1661176SMatthew Knepley Level: developer 4024a1661176SMatthew Knepley 40256a9b8d82SBarry Smith Notes: 40262ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 402758d36128SBarry Smith 40286a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40296a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40306a9b8d82SBarry Smith 40316a9b8d82SBarry Smith Developer Notes: 40322ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 40332ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 40346a9b8d82SBarry Smith 403511a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 40366a9b8d82SBarry Smith 4037fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4038a1661176SMatthew Knepley @*/ 4039d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4040d71ae5a4SJacob Faibussowitsch { 4041a1661176SMatthew Knepley PetscFunctionBegin; 40420700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 40436ba663aaSJed Brown PetscValidType(B, 1); 4044cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 40453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4046a1661176SMatthew Knepley } 4047a1661176SMatthew Knepley 4048ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4049d71ae5a4SJacob Faibussowitsch { 4050a1661176SMatthew Knepley PetscInt i; 4051a1661176SMatthew Knepley PetscInt m, n; 4052a1661176SMatthew Knepley PetscInt nz; 40536a9b8d82SBarry Smith PetscInt *nnz; 4054a1661176SMatthew Knepley 4055a1661176SMatthew Knepley PetscFunctionBegin; 4056aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4057779a8d59SSatish Balay 40589566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 40599566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4060779a8d59SSatish Balay 40619566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 40629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4063a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4064b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 406508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4066a1661176SMatthew Knepley nnz[i] = nz; 4067a1661176SMatthew Knepley } 40689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 40699566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4070a1661176SMatthew Knepley 40718e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4072a1661176SMatthew Knepley 40739566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 40749566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4075a1661176SMatthew Knepley 40769566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 40773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4078a1661176SMatthew Knepley } 4079a1661176SMatthew Knepley 4080ad7e164aSPierre Jolivet /*@ 40812ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4082ad7e164aSPierre Jolivet 4083ad7e164aSPierre Jolivet Input Parameters: 4084ad7e164aSPierre Jolivet + A - left-hand side matrix 4085ad7e164aSPierre Jolivet . B - right-hand side matrix 408611a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4087ad7e164aSPierre Jolivet 4088ad7e164aSPierre Jolivet Output Parameter: 40892ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4090ad7e164aSPierre Jolivet 4091ad7e164aSPierre Jolivet Level: intermediate 4092ad7e164aSPierre Jolivet 409311a5261eSBarry Smith Note: 409411a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 4095ad7e164aSPierre Jolivet 40961cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4097ad7e164aSPierre Jolivet @*/ 4098d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4099d71ae5a4SJacob Faibussowitsch { 4100ad7e164aSPierre Jolivet PetscFunctionBegin; 4101ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4102ad7e164aSPierre Jolivet PetscValidType(A, 1); 4103ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4104ad7e164aSPierre Jolivet PetscValidType(B, 2); 41054f572ea9SToby Isaac PetscAssertPointer(C, 4); 4106ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4107ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4108ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4109ad7e164aSPierre Jolivet } 4110cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4112ad7e164aSPierre Jolivet } 4113ad7e164aSPierre Jolivet 4114ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4115d71ae5a4SJacob Faibussowitsch { 4116ad7e164aSPierre Jolivet Mat newmat; 4117ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4118ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4119ad7e164aSPierre Jolivet PetscScalar *v; 4120fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4121ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4122ad7e164aSPierre Jolivet PetscBool flg; 4123ad7e164aSPierre Jolivet 4124ad7e164aSPierre Jolivet PetscFunctionBegin; 412528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 412628b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 412728b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 412828b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41299566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 413028b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4131aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4132ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41339566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41349566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41359566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41369566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4137ad7e164aSPierre Jolivet i[0] = 0; 4138ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4139ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4140ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4141ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4142ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4143ad7e164aSPierre Jolivet } 4144ad7e164aSPierre Jolivet } 4145ad7e164aSPierre Jolivet } 41469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4147ad7e164aSPierre Jolivet *C = newmat; 41489566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4149ad7e164aSPierre Jolivet nnz = 0; 4150ad7e164aSPierre Jolivet } 41519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 41529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 41539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4154ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4155ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4156ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4157ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4158ad7e164aSPierre Jolivet } 4159ad7e164aSPierre Jolivet } 4160ad7e164aSPierre Jolivet } 41619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 41629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 41639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 41643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4165ad7e164aSPierre Jolivet } 4166ad7e164aSPierre Jolivet 4167c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4168af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4169170fe5c8SBarry Smith 4170170fe5c8SBarry Smith /* 4171170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4172170fe5c8SBarry Smith 4173170fe5c8SBarry Smith n p p 41742da392ccSBarry Smith [ ] [ ] [ ] 41752da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 41762da392ccSBarry Smith [ ] [ ] [ ] 4177170fe5c8SBarry Smith 4178170fe5c8SBarry Smith */ 4179d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4180d71ae5a4SJacob Faibussowitsch { 4181170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4182170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4183170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 418486214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4185170fe5c8SBarry Smith const PetscInt *ii, *idx; 4186170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4187170fe5c8SBarry Smith PetscScalar *c, *c_q; 418886214ceeSStefano Zampini PetscInt clda = sub_c->lda; 418986214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4190170fe5c8SBarry Smith 4191170fe5c8SBarry Smith PetscFunctionBegin; 4192d0f46423SBarry Smith m = A->rmap->n; 4193d0f46423SBarry Smith n = A->cmap->n; 4194d0f46423SBarry Smith p = B->cmap->n; 4195170fe5c8SBarry Smith a = sub_a->v; 4196170fe5c8SBarry Smith b = sub_b->a; 4197170fe5c8SBarry Smith c = sub_c->v; 419886214ceeSStefano Zampini if (clda == m) { 41999566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 420086214ceeSStefano Zampini } else { 420186214ceeSStefano Zampini for (j = 0; j < p; j++) 42029371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 420386214ceeSStefano Zampini } 4204170fe5c8SBarry Smith ii = sub_b->i; 4205170fe5c8SBarry Smith idx = sub_b->j; 4206170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4207170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4208170fe5c8SBarry Smith while (q-- > 0) { 420986214ceeSStefano Zampini c_q = c + clda * (*idx); 421086214ceeSStefano Zampini a_q = a + alda * i; 4211854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4212170fe5c8SBarry Smith idx++; 4213170fe5c8SBarry Smith b++; 4214170fe5c8SBarry Smith } 4215170fe5c8SBarry Smith } 42163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4217170fe5c8SBarry Smith } 4218170fe5c8SBarry Smith 4219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4220d71ae5a4SJacob Faibussowitsch { 4221d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 422286214ceeSStefano Zampini PetscBool cisdense; 4223170fe5c8SBarry Smith 4224170fe5c8SBarry Smith PetscFunctionBegin; 422508401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42269566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42279566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 4228d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 422948a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42309566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4231d73949e8SHong Zhang 42324222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 42333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4234170fe5c8SBarry Smith } 4235170fe5c8SBarry Smith 42360bad9183SKris Buschelman /*MC 4237fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42380bad9183SKris Buschelman based on compressed sparse row format. 42390bad9183SKris Buschelman 42402ef1f0ffSBarry Smith Options Database Key: 42410bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 42420bad9183SKris Buschelman 42430bad9183SKris Buschelman Level: beginner 42440bad9183SKris Buschelman 42450cd7f59aSBarry Smith Notes: 42462ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 42470cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 42480cd7f59aSBarry Smith in the matrix 42490cd7f59aSBarry Smith 425011a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this no 425111a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 42520cd7f59aSBarry Smith 425311a5261eSBarry Smith Developer Note: 42542ef1f0ffSBarry Smith It would be nice if all matrix formats supported passing `NULL` in for the numerical values 42550cd7f59aSBarry Smith 42561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 42570bad9183SKris Buschelman M*/ 42580bad9183SKris Buschelman 4259ccd284c7SBarry Smith /*MC 4260ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4261ccd284c7SBarry Smith 426211a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 426311a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 426411a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4265ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4266ccd284c7SBarry Smith the above preallocation routines for simplicity. 4267ccd284c7SBarry Smith 42682ef1f0ffSBarry Smith Options Database Key: 426911a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4270ccd284c7SBarry Smith 42712ef1f0ffSBarry Smith Level: beginner 42722ef1f0ffSBarry Smith 427311a5261eSBarry Smith Note: 427411a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4275ccd284c7SBarry Smith enough exist. 4276ccd284c7SBarry Smith 42771cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4278ccd284c7SBarry Smith M*/ 4279ccd284c7SBarry Smith 4280ccd284c7SBarry Smith /*MC 4281ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4282ccd284c7SBarry Smith 42832ef1f0ffSBarry Smith Options Database Key: 42842ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 42852ef1f0ffSBarry Smith 42862ef1f0ffSBarry Smith Level: beginner 42872ef1f0ffSBarry Smith 42882ef1f0ffSBarry Smith Note: 428911a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 429011a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 429111a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4292ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4293ccd284c7SBarry Smith the above preallocation routines for simplicity. 4294ccd284c7SBarry Smith 42951cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4296ccd284c7SBarry Smith M*/ 4297ccd284c7SBarry Smith 42987906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 42997906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43007906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43017906f579SHong Zhang #endif 4302d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE)) 4303d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4304d24d4204SJose E. Roman #endif 43057906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43067906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43077906f579SHong Zhang #endif 43087906f579SHong Zhang 4309d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4310c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43114222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43127906f579SHong Zhang 43138c778c55SBarry Smith /*@C 431411a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43158c778c55SBarry Smith 43168c778c55SBarry Smith Not Collective 43178c778c55SBarry Smith 43188c778c55SBarry Smith Input Parameter: 4319fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43208c778c55SBarry Smith 43218c778c55SBarry Smith Output Parameter: 43228c778c55SBarry Smith . array - pointer to the data 43238c778c55SBarry Smith 43248c778c55SBarry Smith Level: intermediate 43258c778c55SBarry Smith 4326ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()` 43278c778c55SBarry Smith @*/ 43285d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4329d71ae5a4SJacob Faibussowitsch { 4330d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43318c778c55SBarry Smith 43328c778c55SBarry Smith PetscFunctionBegin; 4333d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43349566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4335d67d9f35SJunchao Zhang } else { 4336d67d9f35SJunchao Zhang *array = aij->a; 4337d67d9f35SJunchao Zhang } 43383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4339d67d9f35SJunchao Zhang } 4340d67d9f35SJunchao Zhang 4341d67d9f35SJunchao Zhang /*@C 434211a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4343d67d9f35SJunchao Zhang 4344d67d9f35SJunchao Zhang Not Collective 4345d67d9f35SJunchao Zhang 4346d67d9f35SJunchao Zhang Input Parameters: 4347fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4348d67d9f35SJunchao Zhang - array - pointer to the data 4349d67d9f35SJunchao Zhang 4350d67d9f35SJunchao Zhang Level: intermediate 4351d67d9f35SJunchao Zhang 4352ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()` 4353d67d9f35SJunchao Zhang @*/ 43545d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4355d71ae5a4SJacob Faibussowitsch { 4356d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4357d67d9f35SJunchao Zhang 4358d67d9f35SJunchao Zhang PetscFunctionBegin; 4359d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 43609566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4361d67d9f35SJunchao Zhang } else { 4362d67d9f35SJunchao Zhang *array = NULL; 4363d67d9f35SJunchao Zhang } 43649566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 43653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 43668c778c55SBarry Smith } 43678c778c55SBarry Smith 436821e72a00SBarry Smith /*@C 436911a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 43708f1ea47aSStefano Zampini 43710ab4885dSBarry Smith Not Collective; No Fortran Support 43728f1ea47aSStefano Zampini 43738f1ea47aSStefano Zampini Input Parameter: 4374fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43758f1ea47aSStefano Zampini 43768f1ea47aSStefano Zampini Output Parameter: 43778f1ea47aSStefano Zampini . array - pointer to the data 43788f1ea47aSStefano Zampini 43798f1ea47aSStefano Zampini Level: intermediate 43808f1ea47aSStefano Zampini 43811cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 43828f1ea47aSStefano Zampini @*/ 43835d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4384d71ae5a4SJacob Faibussowitsch { 4385d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43868f1ea47aSStefano Zampini 43878f1ea47aSStefano Zampini PetscFunctionBegin; 4388d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 43899566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4390d67d9f35SJunchao Zhang } else { 4391d67d9f35SJunchao Zhang *array = aij->a; 4392d67d9f35SJunchao Zhang } 43933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 43948f1ea47aSStefano Zampini } 43958f1ea47aSStefano Zampini 43968f1ea47aSStefano Zampini /*@C 439711a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 43988f1ea47aSStefano Zampini 43990ab4885dSBarry Smith Not Collective; No Fortran Support 44008f1ea47aSStefano Zampini 44018f1ea47aSStefano Zampini Input Parameter: 4402fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44038f1ea47aSStefano Zampini 44048f1ea47aSStefano Zampini Output Parameter: 44058f1ea47aSStefano Zampini . array - pointer to the data 44068f1ea47aSStefano Zampini 44078f1ea47aSStefano Zampini Level: intermediate 44088f1ea47aSStefano Zampini 44091cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44108f1ea47aSStefano Zampini @*/ 44115d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4412d71ae5a4SJacob Faibussowitsch { 4413d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44148f1ea47aSStefano Zampini 44158f1ea47aSStefano Zampini PetscFunctionBegin; 4416d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44179566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4418d67d9f35SJunchao Zhang } else { 4419d67d9f35SJunchao Zhang *array = NULL; 4420d67d9f35SJunchao Zhang } 44213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4422d67d9f35SJunchao Zhang } 4423d67d9f35SJunchao Zhang 4424d67d9f35SJunchao Zhang /*@C 442511a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4426d67d9f35SJunchao Zhang 44270ab4885dSBarry Smith Not Collective; No Fortran Support 4428d67d9f35SJunchao Zhang 4429d67d9f35SJunchao Zhang Input Parameter: 4430fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4431d67d9f35SJunchao Zhang 4432d67d9f35SJunchao Zhang Output Parameter: 4433d67d9f35SJunchao Zhang . array - pointer to the data 4434d67d9f35SJunchao Zhang 4435d67d9f35SJunchao Zhang Level: intermediate 4436d67d9f35SJunchao Zhang 44371cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4438d67d9f35SJunchao Zhang @*/ 44395d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4440d71ae5a4SJacob Faibussowitsch { 4441d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4442d67d9f35SJunchao Zhang 4443d67d9f35SJunchao Zhang PetscFunctionBegin; 4444d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 44459566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4446d67d9f35SJunchao Zhang } else { 4447d67d9f35SJunchao Zhang *array = aij->a; 4448d67d9f35SJunchao Zhang } 44499566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4451d67d9f35SJunchao Zhang } 4452d67d9f35SJunchao Zhang 4453d67d9f35SJunchao Zhang /*@C 4454d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4455d67d9f35SJunchao Zhang 44560ab4885dSBarry Smith Not Collective; No Fortran Support 4457d67d9f35SJunchao Zhang 4458d67d9f35SJunchao Zhang Input Parameter: 4459fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4460d67d9f35SJunchao Zhang 4461d67d9f35SJunchao Zhang Output Parameter: 4462d67d9f35SJunchao Zhang . array - pointer to the data 4463d67d9f35SJunchao Zhang 4464d67d9f35SJunchao Zhang Level: intermediate 4465d67d9f35SJunchao Zhang 44661cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4467d67d9f35SJunchao Zhang @*/ 44685d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4469d71ae5a4SJacob Faibussowitsch { 4470d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4471d67d9f35SJunchao Zhang 4472d67d9f35SJunchao Zhang PetscFunctionBegin; 4473d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 44749566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4475d67d9f35SJunchao Zhang } else { 4476d67d9f35SJunchao Zhang *array = NULL; 4477d67d9f35SJunchao Zhang } 44783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44798f1ea47aSStefano Zampini } 44808f1ea47aSStefano Zampini 44818f1ea47aSStefano Zampini /*@C 448211a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 44837ee59b9bSJunchao Zhang 44840ab4885dSBarry Smith Not Collective; No Fortran Support 44857ee59b9bSJunchao Zhang 44867ee59b9bSJunchao Zhang Input Parameter: 448711a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 44887ee59b9bSJunchao Zhang 44897ee59b9bSJunchao Zhang Output Parameters: 44907ee59b9bSJunchao Zhang + i - row map array of the matrix 44917ee59b9bSJunchao Zhang . j - column index array of the matrix 44927ee59b9bSJunchao Zhang . a - data array of the matrix 4493fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 44947ee59b9bSJunchao Zhang 4495fe59aa6dSJacob Faibussowitsch Level: developer 44962ef1f0ffSBarry Smith 44977ee59b9bSJunchao Zhang Notes: 44982ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 44997ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 45007ee59b9bSJunchao Zhang 45017ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45022ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45037ee59b9bSJunchao Zhang 45041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45057ee59b9bSJunchao Zhang @*/ 45065d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4507d71ae5a4SJacob Faibussowitsch { 45087ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45097ee59b9bSJunchao Zhang 45107ee59b9bSJunchao Zhang PetscFunctionBegin; 45117ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45127ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45137ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45147ee59b9bSJunchao Zhang } else { 45157ee59b9bSJunchao Zhang if (i) *i = aij->i; 45167ee59b9bSJunchao Zhang if (j) *j = aij->j; 45177ee59b9bSJunchao Zhang if (a) *a = aij->a; 45187ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45197ee59b9bSJunchao Zhang } 45203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45217ee59b9bSJunchao Zhang } 45227ee59b9bSJunchao Zhang 4523cc4c1da9SBarry Smith /*@ 452421e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 452521e72a00SBarry Smith 452621e72a00SBarry Smith Not Collective 452721e72a00SBarry Smith 452821e72a00SBarry Smith Input Parameter: 4529fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 453021e72a00SBarry Smith 453121e72a00SBarry Smith Output Parameter: 453221e72a00SBarry Smith . nz - the maximum number of nonzeros in any row 453321e72a00SBarry Smith 453421e72a00SBarry Smith Level: intermediate 453521e72a00SBarry Smith 4536ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()` 453721e72a00SBarry Smith @*/ 4538d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4539d71ae5a4SJacob Faibussowitsch { 454021e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 454121e72a00SBarry Smith 454221e72a00SBarry Smith PetscFunctionBegin; 454321e72a00SBarry Smith *nz = aij->rmax; 45443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 454521e72a00SBarry Smith } 454621e72a00SBarry Smith 454749abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data) 45482c4ab24aSJunchao Zhang { 454949abdd8aSBarry Smith MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data; 45504d86920dSPierre Jolivet 45512c4ab24aSJunchao Zhang PetscFunctionBegin; 45522c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 45532c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 45542c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 45552c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 45562c4ab24aSJunchao Zhang } 45572c4ab24aSJunchao Zhang 4558d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4559d71ae5a4SJacob Faibussowitsch { 4560394ed5ebSJunchao Zhang MPI_Comm comm; 4561394ed5ebSJunchao Zhang PetscInt *i, *j; 45620d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4563394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4564394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4565394ed5ebSJunchao Zhang PetscInt *Aj; 4566394ed5ebSJunchao Zhang PetscScalar *Aa; 4567f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 4568cbc6b225SStefano Zampini MatType rtype; 4569394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 45702c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 45710d88f7f4SJunchao Zhang PetscBool isorted; 45729f0612e4SBarry Smith PetscBool hypre; 4573394ed5ebSJunchao Zhang 4574394ed5ebSJunchao Zhang PetscFunctionBegin; 45759566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 45769566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4577e8729f6fSJunchao Zhang i = coo_i; 4578e8729f6fSJunchao Zhang j = coo_j; 45799566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 45800d88f7f4SJunchao Zhang 45810d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 45820d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 45830d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 45840d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4585394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 45860d88f7f4SJunchao Zhang if (isorted) { 45870d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 45880d88f7f4SJunchao Zhang else iprev = i[k]; 45890d88f7f4SJunchao Zhang } 4590394ed5ebSJunchao Zhang perm[k] = k; 4591394ed5ebSJunchao Zhang } 4592394ed5ebSJunchao Zhang 45930d88f7f4SJunchao Zhang /* Sort by row if not already */ 45940d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 45952b35a777SBarry Smith PetscCheck(coo_n == 0 || i[coo_n - 1] < M, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "COO row index %" PetscInt_FMT " is >= the matrix row size %" PetscInt_FMT, i[coo_n - 1], M); 4596651b1cf9SStefano Zampini 4597651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4598651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 45999371c9d4SSatish Balay if (i[k] >= 0) break; 4600394ed5ebSJunchao Zhang nneg = k; 46019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4602394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 460335cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4604394ed5ebSJunchao Zhang 46059f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */ 46069f0612e4SBarry Smith PetscCall(PetscArrayzero(Ai, M + 1)); 46079f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4608394ed5ebSJunchao Zhang 460921fb621cSStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", ((PetscObject)mat)->name, &hypre)); 4610651b1cf9SStefano Zampini 4611394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 461235cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4613394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4614394ed5ebSJunchao Zhang while (k < coo_n) { 46150d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 46160d88f7f4SJunchao Zhang PetscInt jprev; 46170d88f7f4SJunchao Zhang 46180d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4619394ed5ebSJunchao Zhang row = i[k]; 46200d88f7f4SJunchao Zhang start = k; 46210d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 46220d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 46230d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 46240d88f7f4SJunchao Zhang if (strictly_sorted) { 46250d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 46260d88f7f4SJunchao Zhang else jprev = j[k]; 46270d88f7f4SJunchao Zhang } 46280d88f7f4SJunchao Zhang k++; 46290d88f7f4SJunchao Zhang } 4630394ed5ebSJunchao Zhang end = k; 46310d88f7f4SJunchao Zhang 4632651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4633651b1cf9SStefano Zampini if (hypre) { 46341690c2aeSBarry Smith PetscInt minj = PETSC_INT_MAX; 4635651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 46360d88f7f4SJunchao Zhang 46370d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 46380d88f7f4SJunchao Zhang PetscCount tmp; 46390d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 46400d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 46411c265611SJunchao Zhang j[p] = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[]) 46420d88f7f4SJunchao Zhang j[start] = row; 46430d88f7f4SJunchao Zhang tmp = perm[start]; 46441c265611SJunchao Zhang perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below 46450d88f7f4SJunchao Zhang perm[p] = tmp; 46460d88f7f4SJunchao Zhang break; 46470d88f7f4SJunchao Zhang } 46480d88f7f4SJunchao Zhang } 46490d88f7f4SJunchao Zhang } else { 4650651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4651651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4652651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4653651b1cf9SStefano Zampini } 46540d88f7f4SJunchao Zhang 4655651b1cf9SStefano Zampini if (hasdiag) { 4656651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4657651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4658651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4659651b1cf9SStefano Zampini } 4660651b1cf9SStefano Zampini } 4661651b1cf9SStefano Zampini } 46620d88f7f4SJunchao Zhang } 46631c265611SJunchao Zhang // sort by columns in a row. perm[] indicates their original order 46640d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 46658551dd9cSJunchao Zhang PetscCheck(end == start || j[end - 1] < N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "COO column index %" PetscInt_FMT " is >= the matrix column size %" PetscInt_FMT, j[end - 1], N); 4666651b1cf9SStefano Zampini 46670d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 46680d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 46690d88f7f4SJunchao Zhang Aj[q] = j[p]; 46700d88f7f4SJunchao Zhang jmap[q] = 1; 46710d88f7f4SJunchao Zhang } 46726497c311SBarry Smith PetscCall(PetscIntCast(end - start, Ai + row)); 46730d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 46740d88f7f4SJunchao Zhang } else { 4675394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4676394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4677651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4678394ed5ebSJunchao Zhang Ai[row] = 1; 4679394ed5ebSJunchao Zhang nnz++; 4680394ed5ebSJunchao Zhang 4681394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4682394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4683394ed5ebSJunchao Zhang q++; 4684394ed5ebSJunchao Zhang jmap[q] = 1; 4685394ed5ebSJunchao Zhang Aj[q] = j[p]; 4686394ed5ebSJunchao Zhang Ai[row]++; 4687394ed5ebSJunchao Zhang nnz++; 4688394ed5ebSJunchao Zhang } else { 4689394ed5ebSJunchao Zhang jmap[q]++; 4690394ed5ebSJunchao Zhang } 4691394ed5ebSJunchao Zhang } 4692394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4693394ed5ebSJunchao Zhang } 46940d88f7f4SJunchao Zhang } 46950d88f7f4SJunchao Zhang 4696394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4697394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 46980d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4699394ed5ebSJunchao Zhang jmap[0] = 0; 4700394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47010d88f7f4SJunchao Zhang 47029f0612e4SBarry Smith if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */ 4703394ed5ebSJunchao Zhang PetscCount *jmap_new; 4704394ed5ebSJunchao Zhang PetscInt *Aj_new; 4705394ed5ebSJunchao Zhang 47069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47079566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47089566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4709394ed5ebSJunchao Zhang jmap = jmap_new; 4710394ed5ebSJunchao Zhang 47119f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new)); 47129566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47139f0612e4SBarry Smith PetscCall(PetscShmgetDeallocateArray((void **)&Aj)); 4714394ed5ebSJunchao Zhang Aj = Aj_new; 4715394ed5ebSJunchao Zhang } 4716394ed5ebSJunchao Zhang 4717394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4718394ed5ebSJunchao Zhang PetscCount *perm_new; 4719cbc6b225SStefano Zampini 47209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 47219566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47229566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4723394ed5ebSJunchao Zhang perm = perm_new; 4724394ed5ebSJunchao Zhang } 4725394ed5ebSJunchao Zhang 47269566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47279f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa)); 47289f0612e4SBarry Smith PetscCall(PetscArrayzero(Aa, nnz)); 47299566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4730394ed5ebSJunchao Zhang 4731394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 47322c4ab24aSJunchao Zhang 47332c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 47342c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 47356497c311SBarry Smith PetscCall(PetscIntCast(nnz, &coo->nz)); 47362c4ab24aSJunchao Zhang coo->n = coo_n; 47372c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 47382c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 47392c4ab24aSJunchao Zhang coo->perm = perm; 474003e76207SPierre Jolivet PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ)); 47413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4742394ed5ebSJunchao Zhang } 4743394ed5ebSJunchao Zhang 4744d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4745d71ae5a4SJacob Faibussowitsch { 4746394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4747394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 47482c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4749394ed5ebSJunchao Zhang PetscScalar *Aa; 47502c4ab24aSJunchao Zhang PetscContainer container; 47512c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4752394ed5ebSJunchao Zhang 4753394ed5ebSJunchao Zhang PetscFunctionBegin; 47542c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 47552c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 47562c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 47572c4ab24aSJunchao Zhang perm = coo->perm; 47582c4ab24aSJunchao Zhang jmap = coo->jmap; 47599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4760394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4761b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4762b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4763b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4764394ed5ebSJunchao Zhang } 47659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 47663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4767394ed5ebSJunchao Zhang } 4768394ed5ebSJunchao Zhang 476934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47705063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 477102fe1965SBarry Smith #endif 4772d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4773d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4774d5e393b6SSuyash Tandon #endif 47753d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47765063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47773d0639e7SStefano Zampini #endif 477802fe1965SBarry Smith 4779d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4780d71ae5a4SJacob Faibussowitsch { 4781273d9f13SBarry Smith Mat_SeqAIJ *b; 478238baddfdSBarry Smith PetscMPIInt size; 4783273d9f13SBarry Smith 4784273d9f13SBarry Smith PetscFunctionBegin; 47859566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 478608401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4787273d9f13SBarry Smith 47884dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47892205254eSKarl Rupp 4790b0a32e0cSBarry Smith B->data = (void *)b; 4791aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4792071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47932205254eSKarl Rupp 4794f4259b30SLisandro Dalcin b->row = NULL; 4795f4259b30SLisandro Dalcin b->col = NULL; 4796f4259b30SLisandro Dalcin b->icol = NULL; 4797b810aeb4SBarry Smith b->reallocs = 0; 479836db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4799f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4800416022c9SBarry Smith b->nonew = 0; 4801f4259b30SLisandro Dalcin b->diag = NULL; 4802f4259b30SLisandro Dalcin b->solve_work = NULL; 4803f4259b30SLisandro Dalcin B->spptr = NULL; 4804f4259b30SLisandro Dalcin b->saved_values = NULL; 4805f4259b30SLisandro Dalcin b->idiag = NULL; 4806f4259b30SLisandro Dalcin b->mdiag = NULL; 4807f4259b30SLisandro Dalcin b->ssor_work = NULL; 480871f1c65dSBarry Smith b->omega = 1.0; 480971f1c65dSBarry Smith b->fshift = 0.0; 4810bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4811a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 481217ab2063SBarry Smith 48139566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4814d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 48169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4817b3866ffcSBarry Smith #endif 48189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 48199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 48209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 48219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 48229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 48239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 48249566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 48259779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4827191b95cbSRichard Tran Mills #endif 482834b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 483202fe1965SBarry Smith #endif 4833d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4834d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4835d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4836d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4837d5e393b6SSuyash Tandon #endif 48383d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 48403d0639e7SStefano Zampini #endif 48419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4842af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4844af8000cdSHong Zhang #endif 4845d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE)) 48469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4847d24d4204SJose E. Roman #endif 484863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 485163c07aadSStefano Zampini #endif 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 485614e4dea2SJose E. Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 48579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 4859674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ)); 48609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48689566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48699566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 48709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 487217ab2063SBarry Smith } 487317ab2063SBarry Smith 4874b24902e0SBarry Smith /* 48753893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4876b24902e0SBarry Smith */ 4877d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4878d71ae5a4SJacob Faibussowitsch { 48792a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4880071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 488117ab2063SBarry Smith 48823a40ed3dSBarry Smith PetscFunctionBegin; 4883aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4884273d9f13SBarry Smith 4885d5f3da31SBarry Smith C->factortype = A->factortype; 4886f4259b30SLisandro Dalcin c->row = NULL; 4887f4259b30SLisandro Dalcin c->col = NULL; 4888f4259b30SLisandro Dalcin c->icol = NULL; 48896ad4291fSHong Zhang c->reallocs = 0; 489069272f91SPierre Jolivet C->assembled = A->assembled; 489117ab2063SBarry Smith 489269272f91SPierre Jolivet if (A->preallocated) { 48939566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48949566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4895eec197d1SBarry Smith 489631fe6a7dSBarry Smith if (!A->hash_active) { 48979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 4898*418fb43bSPierre Jolivet PetscCall(PetscArraycpy(c->imax, a->imax, m)); 48999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 4900*418fb43bSPierre Jolivet PetscCall(PetscArraycpy(c->ilen, a->ilen, m)); 490117ab2063SBarry Smith 490217ab2063SBarry Smith /* allocate the matrix space */ 4903f77e22a1SHong Zhang if (mallocmatspace) { 49049f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a)); 49059f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j)); 49069f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i)); 49079566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 49089f0612e4SBarry Smith c->free_a = PETSC_TRUE; 49099f0612e4SBarry Smith c->free_ij = PETSC_TRUE; 491017ab2063SBarry Smith if (m > 0) { 49119566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4912be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49132e5835c6SStefano Zampini const PetscScalar *aa; 49142e5835c6SStefano Zampini 49159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49169566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 49179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4918be6bf707SBarry Smith } else { 49199566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 492017ab2063SBarry Smith } 492108480c60SBarry Smith } 4922f77e22a1SHong Zhang } 492331fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 492431fe6a7dSBarry Smith } else { 492531fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 492631fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 492731fe6a7dSBarry Smith } 492817ab2063SBarry Smith 49296ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4930416022c9SBarry Smith c->roworiented = a->roworiented; 4931416022c9SBarry Smith c->nonew = a->nonew; 4932f4259b30SLisandro Dalcin c->solve_work = NULL; 4933f4259b30SLisandro Dalcin c->saved_values = NULL; 4934f4259b30SLisandro Dalcin c->idiag = NULL; 4935f4259b30SLisandro Dalcin c->ssor_work = NULL; 4936a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 49376ad4291fSHong Zhang 4938893ad86cSHong Zhang c->rmax = a->rmax; 4939416022c9SBarry Smith c->nz = a->nz; 49408ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4941754ec7b1SSatish Balay 49426ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49436ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4944cd6b891eSBarry Smith if (a->compressedrow.use) { 49456ad4291fSHong Zhang i = a->compressedrow.nrows; 49469566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 494927ea64f8SHong Zhang } else { 495027ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49510298fd71SBarry Smith c->compressedrow.i = NULL; 49520298fd71SBarry Smith c->compressedrow.rindex = NULL; 49536ad4291fSHong Zhang } 4954ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4955e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49564846f1f5SKris Buschelman 49579566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 495869272f91SPierre Jolivet } 49599566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 496117ab2063SBarry Smith } 496217ab2063SBarry Smith 4963d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4964d71ae5a4SJacob Faibussowitsch { 4965b24902e0SBarry Smith PetscFunctionBegin; 49669566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49679566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 496848a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49699566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49709566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 49713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4972b24902e0SBarry Smith } 4973b24902e0SBarry Smith 4974d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4975d71ae5a4SJacob Faibussowitsch { 497652f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 497752f91c60SVaclav Hapla 497852f91c60SVaclav Hapla PetscFunctionBegin; 497952f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 498052f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4981c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49829566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 49839566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 498552f91c60SVaclav Hapla if (isbinary) { 49869566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 498752f91c60SVaclav Hapla } else if (ishdf5) { 498852f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49899566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 499052f91c60SVaclav Hapla #else 499152f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 499252f91c60SVaclav Hapla #endif 499352f91c60SVaclav Hapla } else { 499498921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 499552f91c60SVaclav Hapla } 49963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 499752f91c60SVaclav Hapla } 499852f91c60SVaclav Hapla 4999d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5000d71ae5a4SJacob Faibussowitsch { 50013ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 50023ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5003fbdbba38SShri Abhyankar 5004fbdbba38SShri Abhyankar PetscFunctionBegin; 50059566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5006bbead8a2SBarry Smith 50073ea6fe3dSLisandro Dalcin /* read in matrix header */ 50089566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 500908401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50109371c9d4SSatish Balay M = header[1]; 50119371c9d4SSatish Balay N = header[2]; 50129371c9d4SSatish Balay nz = header[3]; 501308401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 501408401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 501508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5016fbdbba38SShri Abhyankar 50173ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50189566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 50193ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50203ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50213ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50223ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50233ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50249566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50259566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50263ea6fe3dSLisandro Dalcin 50273ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50289566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5029aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50303ea6fe3dSLisandro Dalcin 5031fbdbba38SShri Abhyankar /* read in row lengths */ 50329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 50339566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 50343ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50359371c9d4SSatish Balay sum = 0; 50369371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 503708401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50383ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50409566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5041aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50423ea6fe3dSLisandro Dalcin /* store row lengths */ 50439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50449566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5045fbdbba38SShri Abhyankar 50463ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50479371c9d4SSatish Balay a->i[0] = 0; 50489371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50493ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50509566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50513ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50529566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5053fbdbba38SShri Abhyankar 50549566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 50563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5057fbdbba38SShri Abhyankar } 5058fbdbba38SShri Abhyankar 5059d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5060d71ae5a4SJacob Faibussowitsch { 50617264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5062fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 50637264ac53SSatish Balay 50643a40ed3dSBarry Smith PetscFunctionBegin; 5065bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5066d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5067ca44d042SBarry Smith *flg = PETSC_FALSE; 50683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5069bcd2baecSBarry Smith } 50707264ac53SSatish Balay 50717264ac53SSatish Balay /* if the a->i are the same */ 50729566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 50733ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 50747264ac53SSatish Balay 50757264ac53SSatish Balay /* if a->j are the same */ 50769566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 50773ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5078bcd2baecSBarry Smith 50799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5081bcd2baecSBarry Smith /* if a->a are the same */ 50829566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 50839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 50853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 50867264ac53SSatish Balay } 508736db0b34SBarry Smith 508805869f15SSatish Balay /*@ 508911a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 509036db0b34SBarry Smith provided by the user. 509136db0b34SBarry Smith 5092d083f849SBarry Smith Collective 509336db0b34SBarry Smith 509436db0b34SBarry Smith Input Parameters: 509536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 509636db0b34SBarry Smith . m - number of rows 509736db0b34SBarry Smith . n - number of columns 5098483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 509936db0b34SBarry Smith . j - column indices 510036db0b34SBarry Smith - a - matrix values 510136db0b34SBarry Smith 510236db0b34SBarry Smith Output Parameter: 510336db0b34SBarry Smith . mat - the matrix 510436db0b34SBarry Smith 510536db0b34SBarry Smith Level: intermediate 510636db0b34SBarry Smith 510736db0b34SBarry Smith Notes: 51082ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5109292fb18eSBarry Smith once the matrix is destroyed and not before 511036db0b34SBarry Smith 511136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 511236db0b34SBarry Smith 51132ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 511436db0b34SBarry Smith 5115a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5116a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51178eef79e4SBarry Smith as shown 51182ef1f0ffSBarry Smith .vb 51192ef1f0ffSBarry Smith 1 0 0 51202ef1f0ffSBarry Smith 2 0 3 51212ef1f0ffSBarry Smith 4 5 6 5122a4552177SSatish Balay 51232ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 51242ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51252ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 51262ef1f0ffSBarry Smith .ve 5127a4552177SSatish Balay 51281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 512936db0b34SBarry Smith @*/ 5130d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5131d71ae5a4SJacob Faibussowitsch { 5132cbcfb4deSHong Zhang PetscInt ii; 513336db0b34SBarry Smith Mat_SeqAIJ *aij; 5134cbcfb4deSHong Zhang PetscInt jj; 513536db0b34SBarry Smith 513636db0b34SBarry Smith PetscFunctionBegin; 5137aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51389566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51399566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51409566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51419566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5143ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5146ab93d7beSBarry Smith 514736db0b34SBarry Smith aij->i = i; 514836db0b34SBarry Smith aij->j = j; 514936db0b34SBarry Smith aij->a = a; 515036db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5151e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5152e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 515336db0b34SBarry Smith 5154cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 515536db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 515676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5157aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51589985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 515908401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 516008401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51619985e31cSBarry Smith } 516236db0b34SBarry Smith } 516376bd3646SJed Brown } 516476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 516536db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 516608401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5167da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 516836db0b34SBarry Smith } 516976bd3646SJed Brown } 517036db0b34SBarry Smith 51719566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 51729566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 51733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 517436db0b34SBarry Smith } 5175cbc6b225SStefano Zampini 5176f62e3866SBarry Smith /*@ 517711a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51788a0b0e6bSVictor Minden provided by the user. 51798a0b0e6bSVictor Minden 5180d083f849SBarry Smith Collective 51818a0b0e6bSVictor Minden 51828a0b0e6bSVictor Minden Input Parameters: 51838a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51848a0b0e6bSVictor Minden . m - number of rows 51858a0b0e6bSVictor Minden . n - number of columns 51868a0b0e6bSVictor Minden . i - row indices 51878a0b0e6bSVictor Minden . j - column indices 51881230e6d1SVictor Minden . a - matrix values 51891230e6d1SVictor Minden . nz - number of nonzeros 51902ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51918a0b0e6bSVictor Minden 51928a0b0e6bSVictor Minden Output Parameter: 51938a0b0e6bSVictor Minden . mat - the matrix 51948a0b0e6bSVictor Minden 51958a0b0e6bSVictor Minden Level: intermediate 51968a0b0e6bSVictor Minden 5197f62e3866SBarry Smith Example: 5198f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51999e99939fSJunchao Zhang .vb 52008a0b0e6bSVictor Minden 1 0 0 52018a0b0e6bSVictor Minden 2 0 3 52028a0b0e6bSVictor Minden 4 5 6 52038a0b0e6bSVictor Minden 52048a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52058a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52068a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52079e99939fSJunchao Zhang .ve 5208fe59aa6dSJacob Faibussowitsch 52092ef1f0ffSBarry Smith Note: 5210d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5211d7547e51SJunchao Zhang and are particularly useful in iterative applications. 52128a0b0e6bSVictor Minden 52131cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 52148a0b0e6bSVictor Minden @*/ 5215ce78bad3SBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscCount nz, PetscBool idx) 5216d71ae5a4SJacob Faibussowitsch { 5217d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 52188a0b0e6bSVictor Minden 52198a0b0e6bSVictor Minden PetscFunctionBegin; 52209566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5221ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 52229566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52239566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52249566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 52261230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52271230e6d1SVictor Minden if (idx) { 52281230e6d1SVictor Minden row = i[ii] - 1; 52291230e6d1SVictor Minden col = j[ii] - 1; 52301230e6d1SVictor Minden } else { 52311230e6d1SVictor Minden row = i[ii]; 52321230e6d1SVictor Minden col = j[ii]; 52338a0b0e6bSVictor Minden } 52349566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52358a0b0e6bSVictor Minden } 52369566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52379566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52389566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52408a0b0e6bSVictor Minden } 524136db0b34SBarry Smith 5242d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5243d71ae5a4SJacob Faibussowitsch { 52449c8f2541SHong Zhang PetscFunctionBegin; 52459566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52479c8f2541SHong Zhang } 52489c8f2541SHong Zhang 524981824310SBarry Smith /* 525053dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 525153dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 525253dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 525353dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 525453dd7562SDmitry Karpeev */ 5255d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5256d71ae5a4SJacob Faibussowitsch { 525753dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 525853dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 525953dd7562SDmitry Karpeev PetscBool seqaij; 526053dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 526153dd7562SDmitry Karpeev PetscScalar v; 526253dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 526353dd7562SDmitry Karpeev 526453dd7562SDmitry Karpeev PetscFunctionBegin; 52653ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 526653dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */ 52679566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 526828b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 526953dd7562SDmitry Karpeev if (rowemb) { 52709566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 527108401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 527253dd7562SDmitry Karpeev } else { 527308401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 527453dd7562SDmitry Karpeev } 527553dd7562SDmitry Karpeev if (colemb) { 52769566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 527708401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 527853dd7562SDmitry Karpeev } else { 527908401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 528053dd7562SDmitry Karpeev } 528153dd7562SDmitry Karpeev 5282f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 528353dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5285ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52879566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 528853dd7562SDmitry Karpeev } 528948a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 529053dd7562SDmitry Karpeev count = 0; 529153dd7562SDmitry Karpeev rowindices = NULL; 529253dd7562SDmitry Karpeev colindices = NULL; 529348a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 529448a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 529553dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 529653dd7562SDmitry Karpeev PetscInt row; 529753dd7562SDmitry Karpeev row = i; 529853dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 529953dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 530053dd7562SDmitry Karpeev PetscInt col; 530153dd7562SDmitry Karpeev col = Baij->j[count]; 530253dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 530353dd7562SDmitry Karpeev v = Baij->a[count]; 53049566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 530553dd7562SDmitry Karpeev ++count; 530653dd7562SDmitry Karpeev } 530753dd7562SDmitry Karpeev } 530853dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 530953dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 531053dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 531153dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 531253dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 53133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 531453dd7562SDmitry Karpeev } 531553dd7562SDmitry Karpeev 531658c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5317dec0b466SHong Zhang { 5318dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5319dec0b466SHong Zhang MatScalar *aa = a->a; 5320dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5321dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5322dec0b466SHong Zhang 5323dec0b466SHong Zhang PetscFunctionBegin; 5324dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5325dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5326dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5327dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5328dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 532958c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5330dec0b466SHong Zhang else { 5331dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5332dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5333dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5334dec0b466SHong Zhang } 5335dec0b466SHong Zhang } 5336dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5337dec0b466SHong Zhang fshift_prev = fshift; 5338dec0b466SHong Zhang /* reset ilen and imax for each row */ 5339dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5340dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 5341dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5342dec0b466SHong Zhang } 5343312eded4SPierre Jolivet if (fshift) { 5344dec0b466SHong Zhang if (m) { 5345dec0b466SHong Zhang ai[m] -= fshift; 5346dec0b466SHong Zhang a->nz = ai[m]; 5347dec0b466SHong Zhang } 5348dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5349312eded4SPierre Jolivet A->nonzerostate++; 5350dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5351dec0b466SHong Zhang a->rmax = rmax; 5352dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5353dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5354dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5355312eded4SPierre Jolivet } 53563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5357dec0b466SHong Zhang } 5358dec0b466SHong Zhang 53594099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53604099cc6bSBarry Smith 5361cc4c1da9SBarry Smith /*@ 536211a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53634099cc6bSBarry Smith 5364c3339decSBarry Smith Collective 53654099cc6bSBarry Smith 53664099cc6bSBarry Smith Input Parameters: 53674099cc6bSBarry Smith + mat - the matrix object 53684099cc6bSBarry Smith - matype - matrix type 53694099cc6bSBarry Smith 53704099cc6bSBarry Smith Options Database Key: 53714e187271SRichard Tran Mills . -mat_seqaij_type <method> - for example seqaijcrl 53724099cc6bSBarry Smith 53734099cc6bSBarry Smith Level: intermediate 53744099cc6bSBarry Smith 5375fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 53764099cc6bSBarry Smith @*/ 5377d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5378d71ae5a4SJacob Faibussowitsch { 53794099cc6bSBarry Smith PetscBool sametype; 53805f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53814099cc6bSBarry Smith 53824099cc6bSBarry Smith PetscFunctionBegin; 53834099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53853ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 53864099cc6bSBarry Smith 53879566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53886adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53899566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53914099cc6bSBarry Smith } 53924099cc6bSBarry Smith 53934099cc6bSBarry Smith /*@C 539411a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53954099cc6bSBarry Smith 5396cc4c1da9SBarry Smith Not Collective, No Fortran Support 53974099cc6bSBarry Smith 53984099cc6bSBarry Smith Input Parameters: 5399fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 54004099cc6bSBarry Smith - function - routine to convert to subtype 54014099cc6bSBarry Smith 54022ef1f0ffSBarry Smith Level: advanced 54032ef1f0ffSBarry Smith 54044099cc6bSBarry Smith Notes: 540511a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 54064099cc6bSBarry Smith 54074099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 5408b44f4de4SBarry Smith .vb 5409b44f4de4SBarry Smith -mat_seqaij_type my_mat 5410b44f4de4SBarry Smith .ve 54114099cc6bSBarry Smith 54121cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 54134099cc6bSBarry Smith @*/ 5414d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5415d71ae5a4SJacob Faibussowitsch { 54164099cc6bSBarry Smith PetscFunctionBegin; 54179566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54189566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 54193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54204099cc6bSBarry Smith } 54214099cc6bSBarry Smith 54224099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54234099cc6bSBarry Smith 54244099cc6bSBarry Smith /*@C 542511a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 54264099cc6bSBarry Smith 54274099cc6bSBarry Smith Not Collective 54284099cc6bSBarry Smith 54294099cc6bSBarry Smith Level: advanced 54304099cc6bSBarry Smith 54312ef1f0ffSBarry Smith Note: 54322ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 54332ef1f0ffSBarry Smith 54341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 54354099cc6bSBarry Smith @*/ 5436d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5437d71ae5a4SJacob Faibussowitsch { 54384099cc6bSBarry Smith PetscFunctionBegin; 54393ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 54404099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54414099cc6bSBarry Smith 54429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 54439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54459779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5447485f9817SRichard Tran Mills #endif 54485063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54505063d097SStefano Zampini #endif 5451d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5452d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5453d5e393b6SSuyash Tandon #endif 54545063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54565063d097SStefano Zampini #endif 54574099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54594099cc6bSBarry Smith #endif 54603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54614099cc6bSBarry Smith } 546253dd7562SDmitry Karpeev 546353dd7562SDmitry Karpeev /* 546481824310SBarry Smith Special version for direct calls from Fortran 546581824310SBarry Smith */ 546681824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 546781824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 546881824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 546981824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 547081824310SBarry Smith #endif 547181824310SBarry Smith 547281824310SBarry Smith /* Change these macros so can be used in void function */ 547398921bdaSJacob Faibussowitsch 547498921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54759566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54769566063dSJacob Faibussowitsch #undef PetscCall 54779371c9d4SSatish Balay #define PetscCall(...) \ 54789371c9d4SSatish Balay do { \ 54795f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 548098921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 548198921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 548298921bdaSJacob Faibussowitsch return; \ 548398921bdaSJacob Faibussowitsch } \ 548498921bdaSJacob Faibussowitsch } while (0) 548598921bdaSJacob Faibussowitsch 548698921bdaSJacob Faibussowitsch #undef SETERRQ 54879371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54889371c9d4SSatish Balay do { \ 548998921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 549098921bdaSJacob Faibussowitsch return; \ 549198921bdaSJacob Faibussowitsch } while (0) 549281824310SBarry Smith 5493d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5494d71ae5a4SJacob Faibussowitsch { 549581824310SBarry Smith Mat A = *AA; 549681824310SBarry Smith PetscInt m = *mm, n = *nn; 549781824310SBarry Smith InsertMode is = *isis; 549881824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 549981824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 550081824310SBarry Smith PetscInt *imax, *ai, *ailen; 550181824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 550254f21887SBarry Smith MatScalar *ap, value, *aa; 5503ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5504ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 550581824310SBarry Smith 550681824310SBarry Smith PetscFunctionBegin; 55074994cf47SJed Brown MatCheckPreallocated(A, 1); 550881824310SBarry Smith imax = a->imax; 550981824310SBarry Smith ai = a->i; 551081824310SBarry Smith ailen = a->ilen; 551181824310SBarry Smith aj = a->j; 551281824310SBarry Smith aa = a->a; 551381824310SBarry Smith 551481824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 551581824310SBarry Smith row = im[k]; 551681824310SBarry Smith if (row < 0) continue; 55175f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 55189371c9d4SSatish Balay rp = aj + ai[row]; 55199371c9d4SSatish Balay ap = aa + ai[row]; 55209371c9d4SSatish Balay rmax = imax[row]; 55219371c9d4SSatish Balay nrow = ailen[row]; 552281824310SBarry Smith low = 0; 552381824310SBarry Smith high = nrow; 552481824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 552581824310SBarry Smith if (in[l] < 0) continue; 55265f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 552781824310SBarry Smith col = in[l]; 55282205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 55292205254eSKarl Rupp else value = v[k + l * m]; 55302205254eSKarl Rupp 553181824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 553281824310SBarry Smith 55332205254eSKarl Rupp if (col <= lastcol) low = 0; 55342205254eSKarl Rupp else high = nrow; 553581824310SBarry Smith lastcol = col; 553681824310SBarry Smith while (high - low > 5) { 553781824310SBarry Smith t = (low + high) / 2; 553881824310SBarry Smith if (rp[t] > col) high = t; 553981824310SBarry Smith else low = t; 554081824310SBarry Smith } 554181824310SBarry Smith for (i = low; i < high; i++) { 554281824310SBarry Smith if (rp[i] > col) break; 554381824310SBarry Smith if (rp[i] == col) { 554481824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 554581824310SBarry Smith else ap[i] = value; 554681824310SBarry Smith goto noinsert; 554781824310SBarry Smith } 554881824310SBarry Smith } 554981824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 555081824310SBarry Smith if (nonew == 1) goto noinsert; 55515f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5552fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 55539371c9d4SSatish Balay N = nrow++ - 1; 55549371c9d4SSatish Balay a->nz++; 55559371c9d4SSatish Balay high++; 555681824310SBarry Smith /* shift up all the later entries in this row */ 555781824310SBarry Smith for (ii = N; ii >= i; ii--) { 555881824310SBarry Smith rp[ii + 1] = rp[ii]; 555981824310SBarry Smith ap[ii + 1] = ap[ii]; 556081824310SBarry Smith } 556181824310SBarry Smith rp[i] = col; 556281824310SBarry Smith ap[i] = value; 556381824310SBarry Smith noinsert:; 556481824310SBarry Smith low = i + 1; 556581824310SBarry Smith } 556681824310SBarry Smith ailen[row] = nrow; 556781824310SBarry Smith } 556881824310SBarry Smith PetscFunctionReturnVoid(); 556981824310SBarry Smith } 557098921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 557198921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 557298921bdaSJacob Faibussowitsch * original definitions */ 55739566063dSJacob Faibussowitsch #undef PetscCall 557498921bdaSJacob Faibussowitsch #undef SETERRQ 5575