1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5974e208921SJed Brown const MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 6004e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 6364e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, 
PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 112317ab2063SBarry Smith /* reset ilen and imax for each row */ 11247b083b7cSBarry Smith a->nonzerorowcnt = 0; 1125396832f4SHong Zhang if (A->structure_only) { 11269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1128396832f4SHong Zhang } else { /* !A->structure_only */ 112917ab2063SBarry Smith for (i = 0; i < m; i++) { 113017ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11317b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113217ab2063SBarry Smith } 1133396832f4SHong Zhang } 1134bfeeae90SHong Zhang a->nz = ai[m]; 1135aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused 
space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113617ab2063SBarry Smith 11379566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11389566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11412205254eSKarl Rupp 11428e58a170SBarry Smith A->info.mallocs += a->reallocs; 1143dd5f02e7SSatish Balay a->reallocs = 0; 11446712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114536db0b34SBarry Smith a->rmax = rmax; 11464e220ebcSLois Curfman McInnes 114748a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11489566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11493a40ed3dSBarry Smith PetscFunctionReturn(0); 115017ab2063SBarry Smith } 115117ab2063SBarry Smith 1152d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1153d71ae5a4SJacob Faibussowitsch { 115499cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115599cafbc1SBarry Smith PetscInt i, nz = a->nz; 11562e5835c6SStefano Zampini MatScalar *aa; 115799cafbc1SBarry Smith 115899cafbc1SBarry Smith PetscFunctionBegin; 11599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116399cafbc1SBarry Smith PetscFunctionReturn(0); 116499cafbc1SBarry Smith } 
116599cafbc1SBarry Smith 1166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1167d71ae5a4SJacob Faibussowitsch { 116899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116999cafbc1SBarry Smith PetscInt i, nz = a->nz; 11702e5835c6SStefano Zampini MatScalar *aa; 117199cafbc1SBarry Smith 117299cafbc1SBarry Smith PetscFunctionBegin; 11739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117799cafbc1SBarry Smith PetscFunctionReturn(0); 117899cafbc1SBarry Smith } 117999cafbc1SBarry Smith 1180d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1181d71ae5a4SJacob Faibussowitsch { 1182fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1183fff043a9SJunchao Zhang MatScalar *aa; 11843a40ed3dSBarry Smith 11853a40ed3dSBarry Smith PetscFunctionBegin; 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11879566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11903a40ed3dSBarry Smith PetscFunctionReturn(0); 119117ab2063SBarry Smith } 1192416022c9SBarry Smith 1193d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1194d71ae5a4SJacob Faibussowitsch { 1195cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1196cbc6b225SStefano Zampini 1197cbc6b225SStefano Zampini PetscFunctionBegin; 11989566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1200cbc6b225SStefano Zampini PetscFunctionReturn(0); 1201cbc6b225SStefano Zampini } 
1202cbc6b225SStefano Zampini 1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1204d71ae5a4SJacob Faibussowitsch { 1205416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1206d5d45c9bSBarry Smith 12073a40ed3dSBarry Smith PetscFunctionBegin; 1208aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1209c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121017ab2063SBarry Smith #endif 12119566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12129566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12139566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12159566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12259566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1227901853e0SKris Buschelman 12286718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12296718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12306718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12316718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12326718818eSStefano Zampini due to different matrix sizes */ 12339566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12346718818eSStefano Zampini 12359566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12362e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12452e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12462e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12472e956fe4SStefano Zampini #endif 12484222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12524222ddf1SHong Zhang #endif 1253d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1254d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1255d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1256d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1257d5e393b6SSuyash Tandon #endif 12583d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12603d0639e7SStefano Zampini #endif 12619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1262af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1264af8000cdSHong Zhang #endif 1265d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1267d24d4204SJose E. 
Roman #endif 126863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127163c07aadSStefano Zampini #endif 12729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12762e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12882e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12892e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12902e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12912e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12922e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12932e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12943a40ed3dSBarry Smith PetscFunctionReturn(0); 129517ab2063SBarry Smith } 129617ab2063SBarry Smith 1297d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1298d71ae5a4SJacob Faibussowitsch { 1299416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13003a40ed3dSBarry Smith 13013a40ed3dSBarry Smith PetscFunctionBegin; 1302a65d3064SKris Buschelman switch (op) { 1303d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1304d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1305d71ae5a4SJacob Faibussowitsch break; 1306d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1307d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1308d71ae5a4SJacob Faibussowitsch break; 1309d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1310d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1311d71ae5a4SJacob Faibussowitsch break; 1312d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1313d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1314d71ae5a4SJacob Faibussowitsch break; 1315d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1316d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1317d71ae5a4SJacob Faibussowitsch break; 1318d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1319d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1320d71ae5a4SJacob Faibussowitsch break; 1321d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1322d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1323d71ae5a4SJacob Faibussowitsch break; 13243d472b54SHong Zhang case MAT_SPD: 1325b1646e73SJed Brown case MAT_SYMMETRIC: 1326b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1327b1646e73SJed Brown case MAT_HERMITIAN: 1328b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1329957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1330b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1331b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1332b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13335021d80fSJed Brown break; 13348c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1335a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1336d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1337d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1338d71ae5a4SJacob Faibussowitsch break; 1339d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1340d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1341d71ae5a4SJacob Faibussowitsch break; 1342d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1343d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1344d71ae5a4SJacob Faibussowitsch break; 1345071fcb05SBarry Smith case MAT_SORTED_FULL: 
1346071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1347071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1348071fcb05SBarry Smith break; 1349d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1350d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1351d71ae5a4SJacob Faibussowitsch break; 1352d71ae5a4SJacob Faibussowitsch default: 1353d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1354a65d3064SKris Buschelman } 13553a40ed3dSBarry Smith PetscFunctionReturn(0); 135617ab2063SBarry Smith } 135717ab2063SBarry Smith 1358d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1359d71ae5a4SJacob Faibussowitsch { 1360416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1361fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1362c898d852SStefano Zampini PetscScalar *x; 1363c898d852SStefano Zampini const PetscScalar *aa; 136417ab2063SBarry Smith 13653a40ed3dSBarry Smith PetscFunctionBegin; 13669566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136708401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1369d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1370d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13719566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13722c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137535e7444dSHong Zhang PetscFunctionReturn(0); 137635e7444dSHong Zhang } 137735e7444dSHong Zhang 13789566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137935e7444dSHong Zhang for (i = 0; i < n; i++) { 
1380fdc842d1SBarry Smith x[i] = 0.0; 138135e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 138235e7444dSHong Zhang if (aj[j] == i) { 138335e7444dSHong Zhang x[i] = aa[j]; 138417ab2063SBarry Smith break; 138517ab2063SBarry Smith } 138617ab2063SBarry Smith } 138717ab2063SBarry Smith } 13889566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13903a40ed3dSBarry Smith PetscFunctionReturn(0); 139117ab2063SBarry Smith } 139217ab2063SBarry Smith 1393c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1395d71ae5a4SJacob Faibussowitsch { 1396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13975f22a7b3SSebastian Grimberg const MatScalar *aa; 1398d9ca1df4SBarry Smith PetscScalar *y; 1399d9ca1df4SBarry Smith const PetscScalar *x; 1400d0f46423SBarry Smith PetscInt m = A->rmap->n; 14015c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14025f22a7b3SSebastian Grimberg const MatScalar *v; 1403a77337e4SBarry Smith PetscScalar alpha; 1404d9ca1df4SBarry Smith PetscInt n, i, j; 1405d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14063447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1407ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14085c897100SBarry Smith #endif 140917ab2063SBarry Smith 14103a40ed3dSBarry Smith PetscFunctionBegin; 14119566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14129566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14139566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14155c897100SBarry Smith 14165c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1417fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14185c897100SBarry Smith #else 14193447b6efSHong Zhang if (usecprow) { 14203447b6efSHong Zhang m = cprow.nrows; 14213447b6efSHong Zhang ii = cprow.i; 14227b2bb3b9SHong Zhang ridx = cprow.rindex; 14233447b6efSHong Zhang } else { 14243447b6efSHong Zhang ii = a->i; 14253447b6efSHong Zhang } 142617ab2063SBarry Smith for (i = 0; i < m; i++) { 14273447b6efSHong Zhang idx = a->j + ii[i]; 1428fff043a9SJunchao Zhang v = aa + ii[i]; 14293447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14303447b6efSHong Zhang if (usecprow) { 14317b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14323447b6efSHong Zhang } else { 143317ab2063SBarry Smith alpha = x[i]; 14343447b6efSHong Zhang } 143504fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143617ab2063SBarry Smith } 14375c897100SBarry Smith #endif 14389566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14399566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14409566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14423a40ed3dSBarry Smith PetscFunctionReturn(0); 144317ab2063SBarry Smith } 144417ab2063SBarry Smith 1445d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1446d71ae5a4SJacob Faibussowitsch { 14475c897100SBarry Smith PetscFunctionBegin; 14489566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14499566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14505c897100SBarry Smith PetscFunctionReturn(0); 14515c897100SBarry Smith } 14525c897100SBarry Smith 1453c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145478b84d54SShri Abhyankar 1455d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1456d71ae5a4SJacob Faibussowitsch { 1457416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1458d9fead3dSBarry Smith PetscScalar *y; 145954f21887SBarry Smith const 
PetscScalar *x; 1460fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1461003131ecSBarry Smith PetscInt m = A->rmap->n; 14620298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14637b083b7cSBarry Smith PetscInt n, i; 1464362ced78SSatish Balay PetscScalar sum; 1465ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146617ab2063SBarry Smith 1467b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146897952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1469fee21e36SBarry Smith #endif 1470fee21e36SBarry Smith 14713a40ed3dSBarry Smith PetscFunctionBegin; 1472b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14739566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1474b215bc84SStefano Zampini PetscFunctionReturn(0); 1475b215bc84SStefano Zampini } 14769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14779566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14789566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1479416022c9SBarry Smith ii = a->i; 14804eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14819566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 148297952fefSHong Zhang m = a->compressedrow.nrows; 148397952fefSHong Zhang ii = a->compressedrow.i; 148497952fefSHong Zhang ridx = a->compressedrow.rindex; 148597952fefSHong Zhang for (i = 0; i < m; i++) { 148697952fefSHong Zhang n = ii[i + 1] - ii[i]; 148797952fefSHong Zhang aj = a->j + ii[i]; 1488fff043a9SJunchao Zhang aa = a_a + ii[i]; 148997952fefSHong Zhang sum = 0.0; 1490003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1491003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 149297952fefSHong Zhang y[*ridx++] = sum; 149397952fefSHong Zhang } 149497952fefSHong Zhang } else { /* do not use compressed row format */ 1495b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14963d3eaba7SBarry Smith aj = a->j; 1497fff043a9SJunchao Zhang aa 
= a_a; 1498b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1499b05257ddSBarry Smith #else 150017ab2063SBarry Smith for (i = 0; i < m; i++) { 1501003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1502003131ecSBarry Smith aj = a->j + ii[i]; 1503fff043a9SJunchao Zhang aa = a_a + ii[i]; 150417ab2063SBarry Smith sum = 0.0; 1505003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150617ab2063SBarry Smith y[i] = sum; 150717ab2063SBarry Smith } 15088d195f9aSBarry Smith #endif 1509b05257ddSBarry Smith } 15109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15129566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15143a40ed3dSBarry Smith PetscFunctionReturn(0); 151517ab2063SBarry Smith } 151617ab2063SBarry Smith 1517d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1518d71ae5a4SJacob Faibussowitsch { 1519b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1520b434eb95SMatthew G. Knepley PetscScalar *y; 1521b434eb95SMatthew G. Knepley const PetscScalar *x; 1522fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1523b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1524b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1525b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1526b434eb95SMatthew G. Knepley PetscScalar sum; 1527b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1528b434eb95SMatthew G. Knepley 1529b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1530b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1531b434eb95SMatthew G. Knepley #endif 1532b434eb95SMatthew G. Knepley 1533b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15359566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15369566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1537b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1538b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1539b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1540b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1541b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1542b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1543b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1544fff043a9SJunchao Zhang aa = a_a + ii[i]; 1545b434eb95SMatthew G. Knepley sum = 0.0; 1546b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1547b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1548b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1549b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1550b434eb95SMatthew G. Knepley } 1551b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15523d3eaba7SBarry Smith ii = a->i; 1553b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1554b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1555b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1556fff043a9SJunchao Zhang aa = a_a + ii[i]; 1557b434eb95SMatthew G. Knepley sum = 0.0; 1558b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1559b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1560b434eb95SMatthew G. Knepley y[i] = sum; 1561b434eb95SMatthew G. Knepley } 1562b434eb95SMatthew G. Knepley } 15639566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15659566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1567b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1568b434eb95SMatthew G. Knepley } 1569b434eb95SMatthew G. Knepley 1570d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1571d71ae5a4SJacob Faibussowitsch { 1572b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1573b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1574b434eb95SMatthew G. Knepley const PetscScalar *x; 1575fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1576b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1577b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1578b434eb95SMatthew G. Knepley PetscScalar sum; 1579b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1580b434eb95SMatthew G. Knepley 1581b434eb95SMatthew G. Knepley PetscFunctionBegin; 15829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15839566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15849566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1585b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158648a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1587b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1588b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1589b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1590b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1591b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1592b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1593fff043a9SJunchao Zhang aa = a_a + ii[i]; 1594b434eb95SMatthew G. Knepley sum = y[*ridx]; 1595b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1596b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1597b434eb95SMatthew G. Knepley } 1598b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15993d3eaba7SBarry Smith ii = a->i; 1600b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1601b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1602b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1603fff043a9SJunchao Zhang aa = a_a + ii[i]; 1604b434eb95SMatthew G. Knepley sum = y[i]; 1605b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1606b434eb95SMatthew G. Knepley z[i] = sum; 1607b434eb95SMatthew G. Knepley } 1608b434eb95SMatthew G. Knepley } 16099566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16109566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1613b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1614b434eb95SMatthew G. Knepley } 1615b434eb95SMatthew G. Knepley 1616c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1617d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1618d71ae5a4SJacob Faibussowitsch { 1619416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1620f15663dcSBarry Smith PetscScalar *y, *z; 1621f15663dcSBarry Smith const PetscScalar *x; 1622fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1623d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1624d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1625362ced78SSatish Balay PetscScalar sum; 1626ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16279ea0dfa2SSatish Balay 16283a40ed3dSBarry Smith PetscFunctionBegin; 1629b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16309566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1631b215bc84SStefano Zampini PetscFunctionReturn(0); 1632b215bc84SStefano Zampini } 16339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16349566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16359566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16364eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163897952fefSHong Zhang m = a->compressedrow.nrows; 163997952fefSHong Zhang ii = a->compressedrow.i; 164097952fefSHong Zhang ridx = a->compressedrow.rindex; 164197952fefSHong Zhang for (i = 0; i < m; i++) { 164297952fefSHong Zhang n = ii[i + 1] - ii[i]; 164397952fefSHong Zhang aj = a->j + ii[i]; 1644fff043a9SJunchao Zhang aa = a_a + ii[i]; 164597952fefSHong Zhang sum = y[*ridx]; 1646f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164797952fefSHong Zhang z[*ridx++] = sum; 164897952fefSHong Zhang } 164997952fefSHong Zhang } else { /* do not use compressed row format */ 16503d3eaba7SBarry Smith ii = a->i; 1651f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16523d3eaba7SBarry Smith aj = a->j; 1653fff043a9SJunchao Zhang aa = a_a; 1654f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1655f15663dcSBarry Smith #else 165617ab2063SBarry Smith for (i = 0; i < m; i++) { 1657f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1658f15663dcSBarry Smith aj = a->j + ii[i]; 1659fff043a9SJunchao Zhang aa = a_a + ii[i]; 166017ab2063SBarry Smith sum = y[i]; 1661f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166217ab2063SBarry Smith z[i] = sum; 166317ab2063SBarry Smith } 166402ab625aSSatish Balay #endif 1665f15663dcSBarry Smith } 16669566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16679566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16689566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16703a40ed3dSBarry Smith PetscFunctionReturn(0); 167117ab2063SBarry Smith } 167217ab2063SBarry Smith 167317ab2063SBarry Smith /* 167417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167517ab2063SBarry Smith */ 1676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1677d71ae5a4SJacob Faibussowitsch { 1678416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1679d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1680c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 168117ab2063SBarry Smith 16823a40ed3dSBarry Smith PetscFunctionBegin; 168309f38230SBarry Smith if (!a->diag) { 16849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1685c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168609f38230SBarry Smith } 1687d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1688c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1689c0c07093SJunchao Zhang if (alreadySet) { 1690c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1691c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1692c0c07093SJunchao Zhang } 1693c0c07093SJunchao Zhang 169409f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1695bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1696bfeeae90SHong Zhang if (a->j[j] == i) { 169709f38230SBarry Smith a->diag[i] = j; 169817ab2063SBarry Smith break; 169917ab2063SBarry Smith } 170017ab2063SBarry Smith } 170117ab2063SBarry Smith } 17023a40ed3dSBarry Smith PetscFunctionReturn(0); 170317ab2063SBarry Smith } 170417ab2063SBarry Smith 1705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1706d71ae5a4SJacob Faibussowitsch { 170761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171061ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 171161ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 171261ecd0c6SBarry Smith 171361ecd0c6SBarry Smith PetscFunctionBegin; 
171461ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17169566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171761ecd0c6SBarry Smith PetscFunctionReturn(0); 171861ecd0c6SBarry Smith } 171961ecd0c6SBarry Smith 172061ecd0c6SBarry Smith if (a->diagonaldense) { 172161ecd0c6SBarry Smith cnt = 0; 172261ecd0c6SBarry Smith } else { 17239566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172461ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1725349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172661ecd0c6SBarry Smith cnt++; 172761ecd0c6SBarry Smith mdiag[i] = 1; 172861ecd0c6SBarry Smith } 172961ecd0c6SBarry Smith } 173061ecd0c6SBarry Smith } 173161ecd0c6SBarry Smith if (!cnt) { 17329566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 173361ecd0c6SBarry Smith } else { 1734b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1735b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173661ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173761ecd0c6SBarry Smith 173861ecd0c6SBarry Smith a->a = NULL; 173961ecd0c6SBarry Smith a->j = NULL; 174061ecd0c6SBarry Smith a->i = NULL; 174161ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1742ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 174461ecd0c6SBarry Smith 174561ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174661ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17479566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174848a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1749447d62f5SStefano Zampini } 17509566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17519566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 175261ecd0c6SBarry Smith if (singlemalloc) { 17539566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 175461ecd0c6SBarry Smith } else { 17559566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17569566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17579566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175861ecd0c6SBarry Smith } 175961ecd0c6SBarry Smith } 17609566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 176161ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 176261ecd0c6SBarry Smith PetscFunctionReturn(0); 176361ecd0c6SBarry Smith } 176461ecd0c6SBarry Smith 1765be5855fcSBarry Smith /* 1766be5855fcSBarry Smith Checks for missing diagonals 1767be5855fcSBarry Smith */ 1768d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1769d71ae5a4SJacob Faibussowitsch { 1770be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17717734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1772be5855fcSBarry Smith 1773be5855fcSBarry Smith PetscFunctionBegin; 177409f38230SBarry Smith *missing = PETSC_FALSE; 17757734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177609f38230SBarry Smith *missing = PETSC_TRUE; 177709f38230SBarry Smith if (d) *d = 0; 17789566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177909f38230SBarry Smith } else { 178001445905SHong Zhang PetscInt n; 178101445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1782f1e2ffcdSBarry Smith diag = a->diag; 178301445905SHong Zhang for (i = 0; i < n; i++) { 17847734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178509f38230SBarry Smith *missing = PETSC_TRUE; 178609f38230SBarry Smith if (d) *d = i; 17879566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1788358d2f5dSShri Abhyankar break; 178909f38230SBarry Smith } 1790be5855fcSBarry Smith } 1791be5855fcSBarry Smith } 1792be5855fcSBarry Smith PetscFunctionReturn(0); 1793be5855fcSBarry Smith } 1794be5855fcSBarry Smith 17950da83c2eSBarry Smith #include <petscblaslapack.h> 17960da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17970da83c2eSBarry Smith 17980da83c2eSBarry Smith /* 17990da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18000da83c2eSBarry Smith */ 1801d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1802d71ae5a4SJacob Faibussowitsch { 18030da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18040da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18050da83c2eSBarry Smith const PetscReal shift = 0.0; 18060da83c2eSBarry Smith PetscInt ipvt[5]; 18074e208921SJed Brown PetscCount flops = 0; 18080da83c2eSBarry Smith PetscScalar work[25], *v_work; 18090da83c2eSBarry Smith 18100da83c2eSBarry Smith PetscFunctionBegin; 18110da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18120da83c2eSBarry 
Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 181308401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1814ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18159566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181648a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18170da83c2eSBarry Smith ncnt = 0; 18180da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18190da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18209566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18210da83c2eSBarry Smith switch (bsizes[i]) { 1822d71ae5a4SJacob Faibussowitsch case 1: 1823d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1824d71ae5a4SJacob Faibussowitsch break; 18250da83c2eSBarry Smith case 2: 18269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18270da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18289566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18290da83c2eSBarry Smith break; 18300da83c2eSBarry Smith case 3: 18319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18320da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18339566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18340da83c2eSBarry Smith break; 18350da83c2eSBarry Smith case 4: 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18370da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 
18389566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18390da83c2eSBarry Smith break; 18400da83c2eSBarry Smith case 5: 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18420da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18440da83c2eSBarry Smith break; 18450da83c2eSBarry Smith case 6: 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18470da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18490da83c2eSBarry Smith break; 18500da83c2eSBarry Smith case 7: 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18520da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18540da83c2eSBarry Smith break; 18550da83c2eSBarry Smith default: 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18570da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18590da83c2eSBarry Smith } 18600da83c2eSBarry Smith ncnt += bsizes[i]; 18610da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18624e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18630da83c2eSBarry Smith } 18644e208921SJed Brown PetscLogFlops(flops); 186548a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 
18669566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18670da83c2eSBarry Smith PetscFunctionReturn(0); 18680da83c2eSBarry Smith } 18690da83c2eSBarry Smith 1870422a814eSBarry Smith /* 1871422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1872422a814eSBarry Smith */ 1873d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1874d71ae5a4SJacob Faibussowitsch { 187571f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1876d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18772e5835c6SStefano Zampini const MatScalar *v; 187854f21887SBarry Smith PetscScalar *idiag, *mdiag; 187971f1c65dSBarry Smith 188071f1c65dSBarry Smith PetscFunctionBegin; 188171f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18829566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 188371f1c65dSBarry Smith diag = a->diag; 18844dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18852e5835c6SStefano Zampini 188671f1c65dSBarry Smith mdiag = a->mdiag; 188771f1c65dSBarry Smith idiag = a->idiag; 18889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1889422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 189071f1c65dSBarry Smith for (i = 0; i < m; i++) { 189171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1892899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1893899639b0SHong Zhang if (PetscRealPart(fshift)) { 18949566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18957b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18967b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18977b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189898921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero 
diagonal on row %" PetscInt_FMT, i); 1899899639b0SHong Zhang } 190071f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 190171f1c65dSBarry Smith } 19029566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 190371f1c65dSBarry Smith } else { 190471f1c65dSBarry Smith for (i = 0; i < m; i++) { 190571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 190671f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 190771f1c65dSBarry Smith } 19089566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190971f1c65dSBarry Smith } 191071f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 191271f1c65dSBarry Smith PetscFunctionReturn(0); 191371f1c65dSBarry Smith } 191471f1c65dSBarry Smith 1915c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1916d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1917d71ae5a4SJacob Faibussowitsch { 1918416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1919e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19202e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 192154f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19223d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 192397f1f81fSBarry Smith const PetscInt *idx, *diag; 192417ab2063SBarry Smith 19253a40ed3dSBarry Smith PetscFunctionBegin; 1926b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19279566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1928b215bc84SStefano Zampini PetscFunctionReturn(0); 1929b215bc84SStefano Zampini } 1930b965ef7fSBarry Smith its = its * lits; 193191723122SBarry Smith 193271f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19339566063dSJacob 
Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 193471f1c65dSBarry Smith a->fshift = fshift; 193571f1c65dSBarry Smith a->omega = omega; 1936ed480e8bSBarry Smith 193771f1c65dSBarry Smith diag = a->diag; 193871f1c65dSBarry Smith t = a->ssor_work; 1939ed480e8bSBarry Smith idiag = a->idiag; 194071f1c65dSBarry Smith mdiag = a->mdiag; 1941ed480e8bSBarry Smith 19429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19439566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1945ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 194617ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 194717ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1948ed480e8bSBarry Smith bs = b; 194917ab2063SBarry Smith for (i = 0; i < m; i++) { 195071f1c65dSBarry Smith d = fshift + mdiag[i]; 1951416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1952ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19532e5835c6SStefano Zampini v = aa + diag[i] + 1; 195417ab2063SBarry Smith sum = b[i] * d / omega; 1955003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 195617ab2063SBarry Smith x[i] = sum; 195717ab2063SBarry Smith } 19589566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19599566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19623a40ed3dSBarry Smith PetscFunctionReturn(0); 196317ab2063SBarry Smith } 1964c783ea89SBarry Smith 196508401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1966f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19674c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower 
triangular, 1968887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196917ab2063SBarry Smith 197017ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 197117ab2063SBarry Smith 1972887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 197317ab2063SBarry Smith */ 197417ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 197517ab2063SBarry Smith 197617ab2063SBarry Smith /* x = (E + U)^{-1} b */ 197717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1978416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1979ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19802e5835c6SStefano Zampini v = aa + diag[i] + 1; 198117ab2063SBarry Smith sum = b[i]; 1982e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1983ed480e8bSBarry Smith x[i] = sum * idiag[i]; 198417ab2063SBarry Smith } 198517ab2063SBarry Smith 198617ab2063SBarry Smith /* t = b - (2*E - D)x */ 19872e5835c6SStefano Zampini v = aa; 19882205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198917ab2063SBarry Smith 199017ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1991ed480e8bSBarry Smith ts = t; 1992416022c9SBarry Smith diag = a->diag; 199317ab2063SBarry Smith for (i = 0; i < m; i++) { 1994416022c9SBarry Smith n = diag[i] - a->i[i]; 1995ed480e8bSBarry Smith idx = a->j + a->i[i]; 19962e5835c6SStefano Zampini v = aa + a->i[i]; 199717ab2063SBarry Smith sum = t[i]; 1998003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1999ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2000733d66baSBarry Smith /* x = x + t */ 2001733d66baSBarry Smith x[i] += t[i]; 200217ab2063SBarry Smith } 200317ab2063SBarry Smith 20049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20059566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20073a40ed3dSBarry Smith PetscFunctionReturn(0); 200817ab2063SBarry Smith } 200917ab2063SBarry Smith if (flag & 
SOR_ZERO_INITIAL_GUESS) { 201017ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 201117ab2063SBarry Smith for (i = 0; i < m; i++) { 2012416022c9SBarry Smith n = diag[i] - a->i[i]; 2013ed480e8bSBarry Smith idx = a->j + a->i[i]; 20142e5835c6SStefano Zampini v = aa + a->i[i]; 201517ab2063SBarry Smith sum = b[i]; 2016e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20175c99c7daSBarry Smith t[i] = sum; 2018ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201917ab2063SBarry Smith } 20205c99c7daSBarry Smith xb = t; 20219566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20223a40ed3dSBarry Smith } else xb = b; 202317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 202417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2025416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2026ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20272e5835c6SStefano Zampini v = aa + diag[i] + 1; 202817ab2063SBarry Smith sum = xb[i]; 2029e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20305c99c7daSBarry Smith if (xb == b) { 2031ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20325c99c7daSBarry Smith } else { 2033b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 203417ab2063SBarry Smith } 20355c99c7daSBarry Smith } 20369566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 203717ab2063SBarry Smith } 203817ab2063SBarry Smith its--; 203917ab2063SBarry Smith } 204017ab2063SBarry Smith while (its--) { 204117ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204217ab2063SBarry Smith for (i = 0; i < m; i++) { 2043b19a5dc2SMark Adams /* lower */ 2044b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2045ed480e8bSBarry Smith idx = a->j + a->i[i]; 20462e5835c6SStefano Zampini v = aa + a->i[i]; 204717ab2063SBarry Smith sum = b[i]; 2048e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 
2049b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2050b19a5dc2SMark Adams /* upper */ 2051b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2052b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20532e5835c6SStefano Zampini v = aa + diag[i] + 1; 2054b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2055b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 205617ab2063SBarry Smith } 2057b19a5dc2SMark Adams xb = t; 20589566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2059b19a5dc2SMark Adams } else xb = b; 206017ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 206117ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2062b19a5dc2SMark Adams sum = xb[i]; 2063b19a5dc2SMark Adams if (xb == b) { 2064b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2065416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2066ed480e8bSBarry Smith idx = a->j + a->i[i]; 20672e5835c6SStefano Zampini v = aa + a->i[i]; 2068e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2069ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2070b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2071b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2072b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20732e5835c6SStefano Zampini v = aa + diag[i] + 1; 2074b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2075b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207617ab2063SBarry Smith } 2077b19a5dc2SMark Adams } 2078b19a5dc2SMark Adams if (xb == b) { 20799566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2080b19a5dc2SMark Adams } else { 20819566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2082b19a5dc2SMark Adams } 208317ab2063SBarry Smith } 208417ab2063SBarry Smith } 20859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20869566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2088365a8a9eSBarry Smith PetscFunctionReturn(0); 208917ab2063SBarry Smith } 209017ab2063SBarry Smith 2091d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2092d71ae5a4SJacob Faibussowitsch { 2093416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20944e220ebcSLois Curfman McInnes 20953a40ed3dSBarry Smith PetscFunctionBegin; 20964e220ebcSLois Curfman McInnes info->block_size = 1.0; 20973966268fSBarry Smith info->nz_allocated = a->maxnz; 20983966268fSBarry Smith info->nz_used = a->nz; 20993966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21003966268fSBarry Smith info->assemblies = A->num_ass; 21013966268fSBarry Smith info->mallocs = A->info.mallocs; 21024dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2103d5f3da31SBarry Smith if (A->factortype) { 21044e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21054e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21064e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21074e220ebcSLois Curfman McInnes } else { 21084e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21094e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21104e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21114e220ebcSLois Curfman 
McInnes } 21123a40ed3dSBarry Smith PetscFunctionReturn(0); 211317ab2063SBarry Smith } 211417ab2063SBarry Smith 2115d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2116d71ae5a4SJacob Faibussowitsch { 2117416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2118c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211997b48c8fSBarry Smith const PetscScalar *xx; 21202e5835c6SStefano Zampini PetscScalar *bb, *aa; 2121c7da8527SEric Chamberland PetscInt d = 0; 212217ab2063SBarry Smith 21233a40ed3dSBarry Smith PetscFunctionBegin; 212497b48c8fSBarry Smith if (x && b) { 21259566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21269566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 212797b48c8fSBarry Smith for (i = 0; i < N; i++) { 2128aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2129447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213097b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 213197b48c8fSBarry Smith } 21329566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21339566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 213497b48c8fSBarry Smith } 213597b48c8fSBarry Smith 21369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2137a9817697SBarry Smith if (a->keepnonzeropattern) { 2138f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2139aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21409566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2141f1e2ffcdSBarry Smith } 2142f4df32b1SMatthew Knepley if (diag != 0.0) { 2143c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2144c7da8527SEric Chamberland d = rows[i]; 2145447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 214608401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2147c7da8527SEric Chamberland } 2148f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2149447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21502e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2151f1e2ffcdSBarry Smith } 2152f1e2ffcdSBarry Smith } 2153f1e2ffcdSBarry Smith } else { 2154f4df32b1SMatthew Knepley if (diag != 0.0) { 215517ab2063SBarry Smith for (i = 0; i < N; i++) { 2156aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21577ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2158447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2159447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2160447d62f5SStefano Zampini } else { 2161416022c9SBarry Smith a->ilen[rows[i]] = 1; 21622e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2163bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2164447d62f5SStefano Zampini } 2165447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21669566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 216717ab2063SBarry Smith } 216817ab2063SBarry Smith } 21693a40ed3dSBarry Smith } else { 217017ab2063SBarry Smith for (i = 0; i < N; i++) { 2171aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2172416022c9SBarry Smith a->ilen[rows[i]] = 0; 217317ab2063SBarry Smith } 217417ab2063SBarry Smith } 2175e56f5c9eSBarry Smith A->nonzerostate++; 2176f1e2ffcdSBarry Smith } 21779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2178dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21793a40ed3dSBarry Smith PetscFunctionReturn(0); 218017ab2063SBarry Smith } 218117ab2063SBarry Smith 2182d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2183d71ae5a4SJacob Faibussowitsch { 21846e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21856e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21862b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21876e169961SBarry Smith const PetscScalar *xx; 21882e5835c6SStefano Zampini PetscScalar *bb, *aa; 21896e169961SBarry Smith 21906e169961SBarry Smith PetscFunctionBegin; 21912e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21936e169961SBarry Smith if (x && b) { 21949566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21959566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21962b40b63fSBarry Smith vecs = PETSC_TRUE; 21976e169961SBarry Smith } 21989566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21996e169961SBarry Smith for (i = 0; i < N; i++) { 2200aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 22022205254eSKarl Rupp 22036e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22046e169961SBarry Smith } 22056e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22066e169961SBarry Smith if (!zeroed[i]) { 22076e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22084cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22092e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22102e5835c6SStefano Zampini aa[j] = 0.0; 22116e169961SBarry Smith } 22126e169961SBarry Smith } 22134cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22146e169961SBarry Smith } 22156e169961SBarry Smith if (x && b) { 22169566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22179566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22186e169961SBarry Smith } 22199566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22206e169961SBarry Smith if (diag != 0.0) { 22219566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22221d5a398dSstefano_zampini if (missing) { 22231d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22244cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2225aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22269566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22271d5a398dSstefano_zampini } 22281d5a398dSstefano_zampini } else { 2229ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22306e169961SBarry Smith } 22311d5a398dSstefano_zampini } 22329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2233dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22346e169961SBarry Smith PetscFunctionReturn(0); 22356e169961SBarry Smith } 22366e169961SBarry Smith 2237d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2238d71ae5a4SJacob Faibussowitsch { 2239fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2240fff043a9SJunchao Zhang const PetscScalar *aa; 2241fff043a9SJunchao Zhang PetscInt *itmp; 224217ab2063SBarry Smith 22433a40ed3dSBarry Smith PetscFunctionBegin; 22449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2245416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22462e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 224717ab2063SBarry Smith if (idx) { 2248bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224926fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2250f4259b30SLisandro Dalcin else *idx = NULL; 225117ab2063SBarry Smith } 22529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22533a40ed3dSBarry Smith PetscFunctionReturn(0); 225417ab2063SBarry Smith } 225517ab2063SBarry Smith 2256d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2257d71ae5a4SJacob Faibussowitsch { 22583a40ed3dSBarry Smith PetscFunctionBegin; 2259cb4a9cd9SHong Zhang if (nz) *nz = 0; 22602e5835c6SStefano Zampini if (idx) *idx = NULL; 22612e5835c6SStefano Zampini if (v) *v = NULL; 22623a40ed3dSBarry Smith PetscFunctionReturn(0); 226317ab2063SBarry Smith } 226417ab2063SBarry Smith 2265d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2266d71ae5a4SJacob Faibussowitsch { 2267416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22682e5835c6SStefano Zampini const MatScalar *v; 226936db0b34SBarry Smith PetscReal sum = 0.0; 227097f1f81fSBarry Smith PetscInt i, j; 227117ab2063SBarry Smith 22723a40ed3dSBarry Smith PetscFunctionBegin; 22739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227417ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2275570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2276570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2277792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2278570b7f6dSBarry Smith #else 2279416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22809371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22819371c9d4SSatish Balay v++; 228217ab2063SBarry Smith } 22838f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2284570b7f6dSBarry Smith #endif 22859566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22863a40ed3dSBarry Smith } else if (type == NORM_1) { 228736db0b34SBarry Smith PetscReal *tmp; 228897f1f81fSBarry Smith PetscInt *jj = a->j; 22899566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2290064f8208SBarry Smith *nrm = 0.0; 2291416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22929371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22939371c9d4SSatish Balay v++; 229417ab2063SBarry Smith } 2295d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2296064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229717ab2063SBarry Smith } 22989566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22999566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23003a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2301064f8208SBarry Smith *nrm = 0.0; 2302d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23032e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 230417ab2063SBarry Smith sum = 0.0; 2305416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23069371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23079371c9d4SSatish Balay v2++; 230817ab2063SBarry Smith } 2309064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231017ab2063SBarry Smith } 23119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2312f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23143a40ed3dSBarry Smith PetscFunctionReturn(0); 231517ab2063SBarry Smith } 231617ab2063SBarry Smith 2317d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2318d71ae5a4SJacob Faibussowitsch { 23193d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232054f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23212e5835c6SStefano Zampini const MatScalar *va, *vb; 
232297f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2323cd0d46ebSvictorle 2324cd0d46ebSvictorle PetscFunctionBegin; 23259566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23269566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23275485867bSBarry Smith if (ma != nb || na != mb) { 23285485867bSBarry Smith *f = PETSC_FALSE; 23295485867bSBarry Smith PetscFunctionReturn(0); 23305485867bSBarry Smith } 23319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23339371c9d4SSatish Balay aii = aij->i; 23349371c9d4SSatish Balay bii = bij->i; 23359371c9d4SSatish Balay adx = aij->j; 23369371c9d4SSatish Balay bdx = bij->j; 23379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2339cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2340cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2341cd0d46ebSvictorle 2342cd0d46ebSvictorle *f = PETSC_TRUE; 2343cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2344cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234597f1f81fSBarry Smith PetscInt idc, idr; 23465485867bSBarry Smith PetscScalar vc, vr; 2347cd0d46ebSvictorle /* column/row index/value */ 23485485867bSBarry Smith idc = adx[aptr[i]]; 23495485867bSBarry Smith idr = bdx[bptr[idc]]; 23505485867bSBarry Smith vc = va[aptr[i]]; 23515485867bSBarry Smith vr = vb[bptr[idc]]; 23525485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23535485867bSBarry Smith *f = PETSC_FALSE; 23545485867bSBarry Smith goto done; 2355cd0d46ebSvictorle } else { 23565485867bSBarry Smith aptr[i]++; 23575485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2358cd0d46ebSvictorle } 2359cd0d46ebSvictorle } 2360cd0d46ebSvictorle } 2361cd0d46ebSvictorle done: 23629566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23639566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2366cd0d46ebSvictorle PetscFunctionReturn(0); 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle 2369d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2370d71ae5a4SJacob Faibussowitsch { 23713d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 237254f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 237354f21887SBarry Smith MatScalar *va, *vb; 23741cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23751cbb95d3SBarry Smith 23761cbb95d3SBarry Smith PetscFunctionBegin; 23779566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23789566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23791cbb95d3SBarry Smith if (ma != nb || na != mb) { 23801cbb95d3SBarry Smith *f = PETSC_FALSE; 23811cbb95d3SBarry Smith PetscFunctionReturn(0); 23821cbb95d3SBarry Smith } 23839371c9d4SSatish Balay aii = aij->i; 23849371c9d4SSatish Balay bii = bij->i; 23859371c9d4SSatish Balay adx = aij->j; 23869371c9d4SSatish Balay bdx = bij->j; 23879371c9d4SSatish Balay va = aij->a; 23889371c9d4SSatish Balay vb = bij->a; 23899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23911cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23921cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23931cbb95d3SBarry Smith 23941cbb95d3SBarry Smith *f = PETSC_TRUE; 23951cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23961cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23971cbb95d3SBarry Smith PetscInt idc, idr; 23981cbb95d3SBarry Smith PetscScalar vc, vr; 23991cbb95d3SBarry Smith /* column/row index/value */ 24001cbb95d3SBarry Smith idc = adx[aptr[i]]; 24011cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
24021cbb95d3SBarry Smith vc = va[aptr[i]]; 24031cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24041cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24051cbb95d3SBarry Smith *f = PETSC_FALSE; 24061cbb95d3SBarry Smith goto done; 24071cbb95d3SBarry Smith } else { 24081cbb95d3SBarry Smith aptr[i]++; 24091cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24101cbb95d3SBarry Smith } 24111cbb95d3SBarry Smith } 24121cbb95d3SBarry Smith } 24131cbb95d3SBarry Smith done: 24149566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24159566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24161cbb95d3SBarry Smith PetscFunctionReturn(0); 24171cbb95d3SBarry Smith } 24181cbb95d3SBarry Smith 2419d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2420d71ae5a4SJacob Faibussowitsch { 24219e29f15eSvictorle PetscFunctionBegin; 24229566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24239e29f15eSvictorle PetscFunctionReturn(0); 24249e29f15eSvictorle } 24259e29f15eSvictorle 2426d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2427d71ae5a4SJacob Faibussowitsch { 24281cbb95d3SBarry Smith PetscFunctionBegin; 24299566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24301cbb95d3SBarry Smith PetscFunctionReturn(0); 24311cbb95d3SBarry Smith } 24321cbb95d3SBarry Smith 2433d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2434d71ae5a4SJacob Faibussowitsch { 2435416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2436fff8e43fSBarry Smith const PetscScalar *l, *r; 2437fff8e43fSBarry Smith PetscScalar x; 243854f21887SBarry Smith MatScalar *v; 2439fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2440fff8e43fSBarry Smith const PetscInt *jj; 244117ab2063SBarry Smith 24423a40ed3dSBarry Smith PetscFunctionBegin; 
244317ab2063SBarry Smith if (ll) { 24443ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24453ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24469566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244708401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24489566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 245017ab2063SBarry Smith for (i = 0; i < m; i++) { 245117ab2063SBarry Smith x = l[i]; 2452416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24532205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 245417ab2063SBarry Smith } 24559566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24569566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245817ab2063SBarry Smith } 245917ab2063SBarry Smith if (rr) { 24609566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 246108401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24629566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24642e5835c6SStefano Zampini jj = a->j; 24652205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24679566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24689566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246917ab2063SBarry Smith } 24709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24713a40ed3dSBarry Smith PetscFunctionReturn(0); 247217ab2063SBarry Smith } 247317ab2063SBarry Smith 2474d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2475d71ae5a4SJacob Faibussowitsch { 2476db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2477d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247897f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24795d0c19d7SBarry Smith const PetscInt *irow, *icol; 24802e5835c6SStefano Zampini const PetscScalar *aa; 24815d0c19d7SBarry Smith PetscInt nrows, ncols; 248297f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 248354f21887SBarry Smith MatScalar *a_new, *mat_a; 2484416022c9SBarry Smith Mat C; 2485cdc6f3adSToby Isaac PetscBool stride; 248617ab2063SBarry Smith 24873a40ed3dSBarry Smith PetscFunctionBegin; 24889566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24899566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24909566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 249117ab2063SBarry Smith 24929566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2493ff718158SBarry Smith if (stride) { 24949566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2495ff718158SBarry Smith } else { 2496ff718158SBarry Smith first = 0; 2497ff718158SBarry Smith step = 0; 2498ff718158SBarry Smith } 2499fee21e36SBarry Smith if (stride && step == 1) { 250002834360SBarry Smith /* special case of contiguous rows */ 25019566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 250202834360SBarry Smith /* loop over new rows determining lens and starting points */ 250302834360SBarry Smith for (i = 0; i < nrows; i++) { 2504bfeeae90SHong Zhang kstart = ai[irow[i]]; 2505a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2506a91a9bebSLisandro Dalcin starts[i] = kstart; 250702834360SBarry Smith for (k = kstart; k < kend; k++) { 2508bfeeae90SHong Zhang if (aj[k] >= 
first) { 250902834360SBarry Smith starts[i] = k; 251002834360SBarry Smith break; 251102834360SBarry Smith } 251202834360SBarry Smith } 2513a2744918SBarry Smith sum = 0; 251402834360SBarry Smith while (k < kend) { 2515bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2516a2744918SBarry Smith sum++; 251702834360SBarry Smith } 2518a2744918SBarry Smith lens[i] = sum; 251902834360SBarry Smith } 252002834360SBarry Smith /* create submatrix */ 2521cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 252297f1f81fSBarry Smith PetscInt n_cols, n_rows; 25239566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2524aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25259566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 252608480c60SBarry Smith C = *B; 25273a40ed3dSBarry Smith } else { 25283bef6203SJed Brown PetscInt rbs, cbs; 25299566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25309566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25319566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25329566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25339566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25349566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 253608480c60SBarry Smith } 2537db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2538db02288aSLois Curfman McInnes 253902834360SBarry Smith /* loop over rows inserting into submatrix */ 2540db02288aSLois Curfman McInnes a_new = c->a; 2541db02288aSLois Curfman McInnes j_new = c->j; 2542db02288aSLois Curfman McInnes i_new = c->i; 25439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 254402834360SBarry Smith for (i 
= 0; i < nrows; i++) { 2545a2744918SBarry Smith ii = starts[i]; 2546a2744918SBarry Smith lensi = lens[i]; 2547ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2549a2744918SBarry Smith a_new += lensi; 2550a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2551a2744918SBarry Smith c->ilen[i] = lensi; 255202834360SBarry Smith } 25539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25549566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25553a40ed3dSBarry Smith } else { 25569566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25579566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25589566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25594dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25606bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25614dcab191SBarry Smith smap[icol[i]] = i + 1; 25624dcab191SBarry Smith } 25634dcab191SBarry Smith 256402834360SBarry Smith /* determine lens of each row */ 256502834360SBarry Smith for (i = 0; i < nrows; i++) { 2566bfeeae90SHong Zhang kstart = ai[irow[i]]; 256702834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256802834360SBarry Smith lens[i] = 0; 256902834360SBarry Smith for (k = kstart; k < kend; k++) { 2570ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 257102834360SBarry Smith } 257202834360SBarry Smith } 257317ab2063SBarry Smith /* Create and fill new matrix */ 2574a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2575ace3abfcSBarry Smith PetscBool equal; 25760f5bd95cSBarry Smith 257799141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2578aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == 
ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25799566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 258028b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25819566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 258208480c60SBarry Smith C = *B; 25833a40ed3dSBarry Smith } else { 25843bef6203SJed Brown PetscInt rbs, cbs; 25859566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25869566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25879566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25889566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25899566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25909566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 259208480c60SBarry Smith } 25939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 259499141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 259517ab2063SBarry Smith for (i = 0; i < nrows; i++) { 259699141d43SSatish Balay row = irow[i]; 2597bfeeae90SHong Zhang kstart = ai[row]; 259899141d43SSatish Balay kend = kstart + a->ilen[row]; 2599bfeeae90SHong Zhang mat_i = c->i[i]; 260099141d43SSatish Balay mat_j = c->j + mat_i; 260199141d43SSatish Balay mat_a = c->a + mat_i; 260299141d43SSatish Balay mat_ilen = c->ilen + i; 260317ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2604bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2605ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26062e5835c6SStefano Zampini *mat_a++ = aa[k]; 260799141d43SSatish Balay (*mat_ilen)++; 260817ab2063SBarry Smith } 260917ab2063SBarry Smith } 261017ab2063SBarry Smith } 26119566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 261202834360SBarry Smith /* Free work space */ 26139566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26149566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26159566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2616cdc6f3adSToby Isaac /* sort */ 2617cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2618cdc6f3adSToby Isaac PetscInt ilen; 2619cdc6f3adSToby Isaac 2620cdc6f3adSToby Isaac mat_i = c->i[i]; 2621cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2622cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2623cdc6f3adSToby Isaac ilen = c->ilen[i]; 26249566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2625cdc6f3adSToby Isaac } 262602834360SBarry Smith } 26278c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26289566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2629305c6ccfSStefano Zampini #endif 26309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 263217ab2063SBarry Smith 26339566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2634416022c9SBarry Smith *B = C; 26353a40ed3dSBarry Smith PetscFunctionReturn(0); 263617ab2063SBarry Smith } 263717ab2063SBarry Smith 2638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2639d71ae5a4SJacob Faibussowitsch { 264082d44351SHong Zhang Mat B; 264182d44351SHong Zhang 264282d44351SHong Zhang PetscFunctionBegin; 2643c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26449566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26459566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26469566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26479566063dSJacob Faibussowitsch 
PetscCall(MatSetType(B, MATSEQAIJ)); 26489566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264982d44351SHong Zhang *subMat = B; 2650c2d650bdSHong Zhang } else { 26519566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2652c2d650bdSHong Zhang } 265382d44351SHong Zhang PetscFunctionReturn(0); 265482d44351SHong Zhang } 265582d44351SHong Zhang 2656d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2657d71ae5a4SJacob Faibussowitsch { 265863b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265963b91edcSBarry Smith Mat outA; 2660ace3abfcSBarry Smith PetscBool row_identity, col_identity; 266163b91edcSBarry Smith 26623a40ed3dSBarry Smith PetscFunctionBegin; 266308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26641df811f5SHong Zhang 26659566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26669566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2667a871dcd8SBarry Smith 266863b91edcSBarry Smith outA = inA; 2669d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26709566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26719566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26722205254eSKarl Rupp 26739566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26749566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26752205254eSKarl Rupp 2676c3122656SLisandro Dalcin a->row = row; 26772205254eSKarl Rupp 26789566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26799566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26802205254eSKarl Rupp 2681c3122656SLisandro Dalcin a->col = col; 268263b91edcSBarry Smith 268336db0b34SBarry Smith /* Create the inverse permutation so 
that it can be used in MatLUFactorNumeric() */ 26849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26859566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2686f0ec6fceSSatish Balay 268794a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268994a9d846SBarry Smith } 269063b91edcSBarry Smith 26919566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2692137fb511SHong Zhang if (row_identity && col_identity) { 26939566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2694137fb511SHong Zhang } else { 26959566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2696137fb511SHong Zhang } 26973a40ed3dSBarry Smith PetscFunctionReturn(0); 2698a871dcd8SBarry Smith } 2699a871dcd8SBarry Smith 2700d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2701d71ae5a4SJacob Faibussowitsch { 2702f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2703dfa0f9e5SStefano Zampini PetscScalar *v; 2704c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27053a40ed3dSBarry Smith 27063a40ed3dSBarry Smith PetscFunctionBegin; 27079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27089566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2709792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27133a40ed3dSBarry Smith PetscFunctionReturn(0); 2714f0b747eeSBarry Smith } 2715f0b747eeSBarry Smith 2716d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 
2717d71ae5a4SJacob Faibussowitsch { 271816b64355SHong Zhang PetscInt i; 271916b64355SHong Zhang 272016b64355SHong Zhang PetscFunctionBegin; 272116b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27229566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 272316b64355SHong Zhang 272448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272616b64355SHong Zhang 272716b64355SHong Zhang if (submatj->rbuf1) { 27289566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27299566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 273016b64355SHong Zhang } 273116b64355SHong Zhang 273248a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27339566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 273516b64355SHong Zhang } 273616b64355SHong Zhang 273716b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2738eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27399566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27409566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 274116b64355SHong Zhang #else 27429566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 274316b64355SHong Zhang #endif 274416b64355SHong Zhang 274516b64355SHong Zhang if (!submatj->allcolumns) { 274616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2747eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 274816b64355SHong Zhang #else 27499566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 275016b64355SHong Zhang #endif 
275116b64355SHong Zhang } 27529566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 275316b64355SHong Zhang 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 275516b64355SHong Zhang PetscFunctionReturn(0); 275616b64355SHong Zhang } 275716b64355SHong Zhang 2758d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2759d71ae5a4SJacob Faibussowitsch { 276016b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27615c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 276216b64355SHong Zhang 276316b64355SHong Zhang PetscFunctionBegin; 27649566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27659566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 276616b64355SHong Zhang PetscFunctionReturn(0); 276716b64355SHong Zhang } 276816b64355SHong Zhang 276989a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2770d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2771d71ae5a4SJacob Faibussowitsch { 27722d033e1fSHong Zhang PetscInt i; 27730fb991dcSHong Zhang Mat C; 27740fb991dcSHong Zhang Mat_SeqAIJ *c; 27750fb991dcSHong Zhang Mat_SubSppt *submatj; 27762d033e1fSHong Zhang 27772d033e1fSHong Zhang PetscFunctionBegin; 27782d033e1fSHong Zhang for (i = 0; i < n; i++) { 27790fb991dcSHong Zhang C = (*mat)[i]; 27800fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27810fb991dcSHong Zhang submatj = c->submatis1; 27822d033e1fSHong Zhang if (submatj) { 2783682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278426cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27859566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27869566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27879566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27883faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27899566063dSJacob Faibussowitsch 
PetscCall(PetscLayoutDestroy(&C->rmap)); 27909566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27919566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2792682e4c99SStefano Zampini } 27932d033e1fSHong Zhang } else { 27949566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27952d033e1fSHong Zhang } 27962d033e1fSHong Zhang } 279786e85357SHong Zhang 279863a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27999566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 280063a75b2aSHong Zhang 28019566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28022d033e1fSHong Zhang PetscFunctionReturn(0); 28032d033e1fSHong Zhang } 28042d033e1fSHong Zhang 2805d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2806d71ae5a4SJacob Faibussowitsch { 280797f1f81fSBarry Smith PetscInt i; 2808cddf8d76SBarry Smith 28093a40ed3dSBarry Smith PetscFunctionBegin; 281048a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2811cddf8d76SBarry Smith 281248a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28133a40ed3dSBarry Smith PetscFunctionReturn(0); 2814cddf8d76SBarry Smith } 2815cddf8d76SBarry Smith 2816d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2817d71ae5a4SJacob Faibussowitsch { 2818e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28199a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28205d0c19d7SBarry Smith const PetscInt *idx; 28219a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? 
A->rmap->bs : 1; 2822f1af5d2fSBarry Smith PetscBT table; 2823bbd702dbSSatish Balay 28243a40ed3dSBarry Smith PetscFunctionBegin; 28259a88ca10SBarry Smith m = A->rmap->n / bs; 2826e4d965acSSatish Balay ai = a->i; 2827bfeeae90SHong Zhang aj = a->j; 28288a047759SSatish Balay 282908401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 283006763907SSatish Balay 28319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28329566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 283306763907SSatish Balay 2834e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2835b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2836e4d965acSSatish Balay isz = 0; 28379566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2838e4d965acSSatish Balay 2839e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28409566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28419566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2842e4d965acSSatish Balay 28439a88ca10SBarry Smith if (bs > 1) { 28449a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28459a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28469a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28479a88ca10SBarry Smith } 28489a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28499a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28509a88ca10SBarry Smith 28519a88ca10SBarry Smith k = 0; 28529a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28539a88ca10SBarry Smith n = isz; 28549a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28559a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28569a88ca10SBarry Smith row = bs * nidx[k] + ll; 28579a88ca10SBarry Smith start = ai[row]; 28589a88ca10SBarry Smith end = ai[row + 1]; 28599a88ca10SBarry Smith for (l = start; l < end; l++) { 28609a88ca10SBarry Smith val = aj[l] / bs; 28619a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28629a88ca10SBarry Smith } 28639a88ca10SBarry Smith } 28649a88ca10SBarry Smith } 28659a88ca10SBarry Smith } 28669a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28679a88ca10SBarry Smith } else { 2868dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2869e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28702205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28714dcbc457SBarry Smith } 28729566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28739566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2874e4d965acSSatish Balay 287504a348a9SBarry Smith k = 0; 287604a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287704a348a9SBarry Smith n = isz; 287806763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2879e4d965acSSatish Balay row = nidx[k]; 2880e4d965acSSatish Balay start = ai[row]; 2881e4d965acSSatish Balay end = ai[row + 1]; 288204a348a9SBarry Smith for (l = start; l < end; l++) { 2883efb16452SHong Zhang val = aj[l]; 28842205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2885e4d965acSSatish Balay } 2886e4d965acSSatish Balay } 2887e4d965acSSatish Balay } 28889566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2889e4d965acSSatish Balay } 28909a88ca10SBarry Smith } 28919566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28929566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28933a40ed3dSBarry Smith PetscFunctionReturn(0); 28944dcbc457SBarry Smith } 289517ab2063SBarry Smith 28960513a670SBarry Smith /* -------------------------------------------------------------- */ 2897d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2898d71ae5a4SJacob Faibussowitsch { 28990513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29003b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29015d0c19d7SBarry Smith const PetscInt *row, *col; 29025d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 290356cd22aeSBarry Smith IS icolp, irowp; 29040298fd71SBarry Smith PetscInt *cwork = NULL; 
29050298fd71SBarry Smith PetscScalar *vwork = NULL; 29060513a670SBarry Smith 29073a40ed3dSBarry Smith PetscFunctionBegin; 29089566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29099566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29109566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29119566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29120513a670SBarry Smith 29130513a670SBarry Smith /* determine lengths of permuted rows */ 29149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29152205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29169566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29179566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29189566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29199566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29219566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29220513a670SBarry Smith 29239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29240513a670SBarry Smith for (i = 0; i < m; i++) { 29259566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29262205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29279566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29289566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29290513a670SBarry Smith } 29309566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29312205254eSKarl Rupp 29323c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29332205254eSKarl Rupp 29348c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29359566063dSJacob Faibussowitsch 
PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29369fe5e383SStefano Zampini #endif 29379566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29389566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29399566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29409566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29429566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 294348a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29443a40ed3dSBarry Smith PetscFunctionReturn(0); 29450513a670SBarry Smith } 29460513a670SBarry Smith 2947d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2948d71ae5a4SJacob Faibussowitsch { 2949cb5b572fSBarry Smith PetscFunctionBegin; 295033f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 295133f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2952be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2953be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29542e5835c6SStefano Zampini const PetscScalar *aa; 2955be6bf707SBarry Smith 29569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295708401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29599566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2961cb5b572fSBarry Smith } else { 29629566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2963cb5b572fSBarry Smith } 2964cb5b572fSBarry Smith PetscFunctionReturn(0); 2965cb5b572fSBarry Smith } 2966cb5b572fSBarry Smith 2967d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2968d71ae5a4SJacob Faibussowitsch { 2969273d9f13SBarry Smith PetscFunctionBegin; 29709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2971273d9f13SBarry Smith PetscFunctionReturn(0); 2972273d9f13SBarry Smith } 2973273d9f13SBarry Smith 2974d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2975d71ae5a4SJacob Faibussowitsch { 29766c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29776e111a19SKarl Rupp 29786c0721eeSBarry Smith PetscFunctionBegin; 29796c0721eeSBarry Smith *array = a->a; 29806c0721eeSBarry Smith PetscFunctionReturn(0); 29816c0721eeSBarry Smith } 29826c0721eeSBarry Smith 2983d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2984d71ae5a4SJacob Faibussowitsch { 29856c0721eeSBarry Smith PetscFunctionBegin; 2986f38c1e66SStefano Zampini *array = NULL; 29876c0721eeSBarry Smith PetscFunctionReturn(0); 29886c0721eeSBarry Smith } 2989273d9f13SBarry Smith 29908229c054SShri Abhyankar /* 29918229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29928229c054SShri Abhyankar have different nonzero structure. 29938229c054SShri Abhyankar */ 2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2995d71ae5a4SJacob Faibussowitsch { 2996b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2997ec7775f6SShri Abhyankar 2998ec7775f6SShri Abhyankar PetscFunctionBegin; 2999ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3000ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 3001b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 3002b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3003b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30048af7cee1SJed Brown nnz[i] = 0; 30058af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3006b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3007b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30088af7cee1SJed Brown nnz[i]++; 30098af7cee1SJed Brown } 30108af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3011ec7775f6SShri Abhyankar } 3012ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3013ec7775f6SShri Abhyankar } 3014ec7775f6SShri Abhyankar 3015d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3016d71ae5a4SJacob Faibussowitsch { 3017b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3018b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3019b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 3020b264fe52SHong Zhang 3021b264fe52SHong Zhang PetscFunctionBegin; 3022b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30239566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 3024b264fe52SHong Zhang PetscFunctionReturn(0); 3025b264fe52SHong Zhang } 3026b264fe52SHong Zhang 3027d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3028d71ae5a4SJacob Faibussowitsch { 3029ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3030ac90fabeSBarry Smith 3031ac90fabeSBarry Smith PetscFunctionBegin; 3032134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3033134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3034134adf20SPierre Jolivet if (e) { 30359566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 303681fa06acSBarry Smith if (e) { 30379566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3038134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303981fa06acSBarry Smith } 304081fa06acSBarry Smith } 304154c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 304281fa06acSBarry Smith } 3043ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30442e5835c6SStefano Zampini const PetscScalar *xa; 30452e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 304681fa06acSBarry Smith PetscBLASInt one = 1, bnz; 304781fa06acSBarry Smith 30489566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3051792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30569566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3057ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30589566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3059ac90fabeSBarry Smith } else { 30608229c054SShri Abhyankar Mat B; 30618229c054SShri Abhyankar PetscInt *nnz; 30629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30639566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30649566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30659566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30669566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30679566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30699566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30709566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30719bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30729566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3073ac90fabeSBarry Smith } 3074ac90fabeSBarry Smith PetscFunctionReturn(0); 3075ac90fabeSBarry Smith } 3076ac90fabeSBarry Smith 3077d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3078d71ae5a4SJacob Faibussowitsch { 3079354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3080354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3081354c94deSBarry Smith 
PetscInt i, nz; 3082354c94deSBarry Smith PetscScalar *a; 3083354c94deSBarry Smith 3084354c94deSBarry Smith PetscFunctionBegin; 3085354c94deSBarry Smith nz = aij->nz; 30869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30872205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3089354c94deSBarry Smith #else 3090354c94deSBarry Smith PetscFunctionBegin; 3091354c94deSBarry Smith #endif 3092354c94deSBarry Smith PetscFunctionReturn(0); 3093354c94deSBarry Smith } 3094354c94deSBarry Smith 3095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3096d71ae5a4SJacob Faibussowitsch { 3097e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3098d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3099e34fafa9SBarry Smith PetscReal atmp; 3100985db425SBarry Smith PetscScalar *x; 3101ce496241SStefano Zampini const MatScalar *aa, *av; 3102e34fafa9SBarry Smith 3103e34fafa9SBarry Smith PetscFunctionBegin; 310428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3106ce496241SStefano Zampini aa = av; 3107e34fafa9SBarry Smith ai = a->i; 3108e34fafa9SBarry Smith aj = a->j; 3109e34fafa9SBarry Smith 31109566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31119566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31129566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3114e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31159371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31169371c9d4SSatish Balay ai++; 3117e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3118985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
31199371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31209371c9d4SSatish Balay x[i] = atmp; 31219371c9d4SSatish Balay if (idx) idx[i] = *aj; 31229371c9d4SSatish Balay } 31239371c9d4SSatish Balay aa++; 31249371c9d4SSatish Balay aj++; 3125985db425SBarry Smith } 3126985db425SBarry Smith } 31279566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3129985db425SBarry Smith PetscFunctionReturn(0); 3130985db425SBarry Smith } 3131985db425SBarry Smith 3132d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3133d71ae5a4SJacob Faibussowitsch { 3134985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3135d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3136985db425SBarry Smith PetscScalar *x; 3137ce496241SStefano Zampini const MatScalar *aa, *av; 3138985db425SBarry Smith 3139985db425SBarry Smith PetscFunctionBegin; 314028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3142ce496241SStefano Zampini aa = av; 3143985db425SBarry Smith ai = a->i; 3144985db425SBarry Smith aj = a->j; 3145985db425SBarry Smith 31469566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31479566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31489566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 314908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3150985db425SBarry Smith for (i = 0; i < m; i++) { 31519371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31529371c9d4SSatish Balay ai++; 3153d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31549371c9d4SSatish Balay x[i] = *aa; 31559371c9d4SSatish Balay if (idx) idx[i] = 0; 3156985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3157985db425SBarry Smith x[i] = 0.0; 3158985db425SBarry Smith if (idx) { 3159985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3160985db425SBarry Smith if (aj[j] > j) { 3161985db425SBarry Smith idx[i] = j; 3162985db425SBarry Smith break; 3163985db425SBarry Smith } 3164985db425SBarry Smith } 31651a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31661a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3167985db425SBarry Smith } 3168985db425SBarry Smith } 3169985db425SBarry Smith for (j = 0; j < ncols; j++) { 31709371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31719371c9d4SSatish Balay x[i] = *aa; 31729371c9d4SSatish Balay if (idx) idx[i] = *aj; 31739371c9d4SSatish Balay } 31749371c9d4SSatish Balay aa++; 31759371c9d4SSatish Balay aj++; 3176985db425SBarry Smith } 3177985db425SBarry Smith } 31789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3180985db425SBarry Smith PetscFunctionReturn(0); 3181985db425SBarry Smith } 3182985db425SBarry Smith 3183d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3184d71ae5a4SJacob Faibussowitsch { 3185c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3186c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3187ce496241SStefano Zampini PetscScalar *x; 3188ce496241SStefano Zampini const MatScalar *aa, *av; 3189c87e5d42SMatthew Knepley 3190c87e5d42SMatthew Knepley PetscFunctionBegin; 31919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3192ce496241SStefano Zampini aa = av; 3193c87e5d42SMatthew Knepley ai = a->i; 3194c87e5d42SMatthew Knepley aj = a->j; 3195c87e5d42SMatthew Knepley 31969566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31979566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31989566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 319908401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3200c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32019371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32029371c9d4SSatish Balay ai++; 3203f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32049371c9d4SSatish Balay x[i] = *aa; 32059371c9d4SSatish Balay if (idx) idx[i] = 0; 3206f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3207f07e67edSHong Zhang x[i] = 0.0; 3208f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3209289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3210f07e67edSHong Zhang if (aj[j] > j) { 3211f07e67edSHong Zhang idx[i] = j; 32122205254eSKarl Rupp break; 32132205254eSKarl Rupp } 3214289a08f5SMatthew Knepley } 3215f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3216f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3217f07e67edSHong Zhang } 3218289a08f5SMatthew Knepley } 3219c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32209371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32219371c9d4SSatish Balay x[i] = *aa; 32229371c9d4SSatish Balay if (idx) idx[i] = *aj; 32239371c9d4SSatish Balay } 32249371c9d4SSatish Balay aa++; 32259371c9d4SSatish Balay aj++; 3226c87e5d42SMatthew Knepley } 3227c87e5d42SMatthew Knepley } 32289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3230c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3231c87e5d42SMatthew Knepley } 3232c87e5d42SMatthew Knepley 3233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3234d71ae5a4SJacob 
Faibussowitsch { 3235985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3236d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3237d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3238985db425SBarry Smith PetscScalar *x; 3239ce496241SStefano Zampini const MatScalar *aa, *av; 3240985db425SBarry Smith 3241985db425SBarry Smith PetscFunctionBegin; 324228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3244ce496241SStefano Zampini aa = av; 3245985db425SBarry Smith ai = a->i; 3246985db425SBarry Smith aj = a->j; 3247985db425SBarry Smith 32489566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32499566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32509566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 325108401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3252985db425SBarry Smith for (i = 0; i < m; i++) { 32539371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32549371c9d4SSatish Balay ai++; 3255d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32569371c9d4SSatish Balay x[i] = *aa; 32579371c9d4SSatish Balay if (idx) idx[i] = 0; 3258985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3259985db425SBarry Smith x[i] = 0.0; 3260985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3261985db425SBarry Smith for (j = 0; j < ncols; j++) { 3262985db425SBarry Smith if (aj[j] > j) { 3263985db425SBarry Smith idx[i] = j; 3264985db425SBarry Smith break; 3265985db425SBarry Smith } 3266985db425SBarry Smith } 3267fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3268fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3269985db425SBarry Smith } 3270985db425SBarry Smith } 3271985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32729371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32739371c9d4SSatish Balay x[i] = *aa; 32749371c9d4SSatish Balay if (idx) idx[i] = *aj; 32759371c9d4SSatish Balay } 32769371c9d4SSatish Balay aa++; 32779371c9d4SSatish Balay aj++; 3278e34fafa9SBarry Smith } 3279e34fafa9SBarry Smith } 32809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3282e34fafa9SBarry Smith PetscFunctionReturn(0); 3283e34fafa9SBarry Smith } 3284bbead8a2SBarry Smith 3285d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3286d71ae5a4SJacob Faibussowitsch { 3287bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 328833d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3289bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32900da83c2eSBarry Smith const PetscReal shift = 0.0; 32911a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3292bbead8a2SBarry Smith 3293bbead8a2SBarry Smith PetscFunctionBegin; 3294a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32954a0d0026SBarry Smith if (a->ibdiagvalid) { 32964a0d0026SBarry Smith if (values) *values = a->ibdiag; 32974a0d0026SBarry Smith PetscFunctionReturn(0); 32984a0d0026SBarry Smith } 32999566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33004dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3301bbead8a2SBarry Smith diag = a->ibdiag; 3302bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3303bbead8a2SBarry Smith /* factor and invert each block */ 3304bbead8a2SBarry Smith switch (bs) { 3305bbead8a2SBarry Smith case 1: 3306bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33079566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3308ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3309ec1892c8SHong Zhang if (allowzeropivot) { 33107b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33117b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33127b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33139566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 331498921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3315ec1892c8SHong Zhang } 3316bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3317bbead8a2SBarry Smith } 3318bbead8a2SBarry Smith break; 3319bbead8a2SBarry Smith case 2: 3320bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33219371c9d4SSatish Balay ij[0] = 2 * i; 33229371c9d4SSatish Balay ij[1] = 2 * i + 1; 33239566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33249566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33257b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3327bbead8a2SBarry Smith diag += 4; 3328bbead8a2SBarry Smith } 3329bbead8a2SBarry Smith break; 3330bbead8a2SBarry Smith case 3: 3331bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33329371c9d4SSatish Balay ij[0] = 3 * i; 33339371c9d4SSatish Balay ij[1] = 3 * i + 1; 33349371c9d4SSatish Balay ij[2] = 3 * i + 2; 33359566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33377b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33389566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3339bbead8a2SBarry Smith diag += 9; 3340bbead8a2SBarry Smith } 3341bbead8a2SBarry Smith break; 3342bbead8a2SBarry Smith case 4: 3343bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33449371c9d4SSatish Balay ij[0] = 4 * i; 33459371c9d4SSatish Balay ij[1] = 4 * i + 1; 33469371c9d4SSatish Balay ij[2] = 4 * i + 2; 33479371c9d4SSatish Balay ij[3] = 4 * i + 3; 33489566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33507b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3352bbead8a2SBarry Smith diag += 16; 3353bbead8a2SBarry Smith } 3354bbead8a2SBarry Smith break; 3355bbead8a2SBarry Smith case 5: 3356bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33579371c9d4SSatish Balay ij[0] = 5 * i; 33589371c9d4SSatish Balay ij[1] = 5 * i + 1; 33599371c9d4SSatish Balay ij[2] = 5 * i + 2; 33609371c9d4SSatish Balay ij[3] = 5 * i + 3; 33619371c9d4SSatish Balay ij[4] = 5 * i + 4; 33629566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33647b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3366bbead8a2SBarry Smith diag += 25; 3367bbead8a2SBarry Smith } 3368bbead8a2SBarry Smith break; 3369bbead8a2SBarry Smith case 6: 3370bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33719371c9d4SSatish Balay ij[0] = 6 * i; 33729371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33739371c9d4SSatish Balay ij[2] = 6 * i + 2; 33749371c9d4SSatish Balay ij[3] = 6 * i + 3; 33759371c9d4SSatish Balay ij[4] = 6 * i + 4; 33769371c9d4SSatish Balay ij[5] = 6 * i + 5; 33779566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33789566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33797b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3381bbead8a2SBarry Smith diag += 36; 3382bbead8a2SBarry Smith } 3383bbead8a2SBarry Smith break; 3384bbead8a2SBarry Smith case 7: 3385bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33869371c9d4SSatish Balay ij[0] = 7 * i; 33879371c9d4SSatish Balay ij[1] = 7 * i + 1; 33889371c9d4SSatish Balay ij[2] = 7 * i + 2; 33899371c9d4SSatish Balay ij[3] = 7 * i + 3; 33909371c9d4SSatish Balay ij[4] = 7 * i + 4; 33919371c9d4SSatish Balay ij[5] = 7 * i + 5; 3392cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 33939566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33949566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33957b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33969566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3397bbead8a2SBarry Smith diag += 49; 3398bbead8a2SBarry Smith } 3399bbead8a2SBarry Smith break; 3400bbead8a2SBarry Smith default: 34019566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3402bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3403ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34049566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, 
v_work, allowzeropivot, &zeropivotdetected)); 34067b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34079566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3408bbead8a2SBarry Smith diag += bs2; 3409bbead8a2SBarry Smith } 34109566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3411bbead8a2SBarry Smith } 3412bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3413bbead8a2SBarry Smith PetscFunctionReturn(0); 3414bbead8a2SBarry Smith } 3415bbead8a2SBarry Smith 3416d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3417d71ae5a4SJacob Faibussowitsch { 341873a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3419fff043a9SJunchao Zhang PetscScalar a, *aa; 342073a71a0fSBarry Smith PetscInt m, n, i, j, col; 342173a71a0fSBarry Smith 342273a71a0fSBarry Smith PetscFunctionBegin; 342373a71a0fSBarry Smith if (!x->assembled) { 34249566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 342573a71a0fSBarry Smith for (i = 0; i < m; i++) { 342673a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34279566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 342873a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34299566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 343073a71a0fSBarry Smith } 343173a71a0fSBarry Smith } 3432e2ce353bSJunchao Zhang } else { 34339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34349566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3436e2ce353bSJunchao Zhang } 34379566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34389566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 343973a71a0fSBarry Smith PetscFunctionReturn(0); 
344073a71a0fSBarry Smith } 344173a71a0fSBarry Smith 3442679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3443d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3444d71ae5a4SJacob Faibussowitsch { 3445679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3446679944adSJunchao Zhang PetscScalar a; 3447679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3448679944adSJunchao Zhang 3449679944adSJunchao Zhang PetscFunctionBegin; 3450679944adSJunchao Zhang nskip = high - low; 34519566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3452679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3453679944adSJunchao Zhang for (i = 0; i < m; i++) { 3454679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34559566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3456679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3457679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34589566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3459679944adSJunchao Zhang } 3460e2ce353bSJunchao Zhang } 34619566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34629566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 3463679944adSJunchao Zhang PetscFunctionReturn(0); 3464679944adSJunchao Zhang } 3465679944adSJunchao Zhang 3466682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34670a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3468cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3469cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3470cb5b572fSBarry Smith MatMult_SeqAIJ, 347197304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34727c922b88SBarry Smith 
MatMultTranspose_SeqAIJ, 34737c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3474f4259b30SLisandro Dalcin NULL, 3475f4259b30SLisandro Dalcin NULL, 3476f4259b30SLisandro Dalcin NULL, 3477f4259b30SLisandro Dalcin /* 10*/ NULL, 3478cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3479f4259b30SLisandro Dalcin NULL, 348041f059aeSBarry Smith MatSOR_SeqAIJ, 348191e9d3e2SHong Zhang MatTranspose_SeqAIJ, 348297304618SKris Buschelman /* 15*/ MatGetInfo_SeqAIJ, 3483cb5b572fSBarry Smith MatEqual_SeqAIJ, 3484cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3485cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3486cb5b572fSBarry Smith MatNorm_SeqAIJ, 3487f4259b30SLisandro Dalcin /* 20*/ NULL, 3488cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3489cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3490cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3491d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3492f4259b30SLisandro Dalcin NULL, 3493f4259b30SLisandro Dalcin NULL, 3494f4259b30SLisandro Dalcin NULL, 3495f4259b30SLisandro Dalcin NULL, 34964994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3497f4259b30SLisandro Dalcin NULL, 3498f4259b30SLisandro Dalcin NULL, 3499f4259b30SLisandro Dalcin NULL, 3500f4259b30SLisandro Dalcin NULL, 3501d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 3504cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3505f4259b30SLisandro Dalcin NULL, 3506d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35077dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3508cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3509cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3510cb5b572fSBarry Smith MatCopy_SeqAIJ, 3511d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3512cb5b572fSBarry Smith MatScale_SeqAIJ, 35137d68702bSBarry Smith MatShift_SeqAIJ, 351479299369SBarry Smith MatDiagonalSet_SeqAIJ, 35156e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 351673a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35173b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ,
35183b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35193b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3520a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 352193dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3522f4259b30SLisandro Dalcin NULL, 3523f4259b30SLisandro Dalcin NULL, 3524cda55fadSBarry Smith MatPermute_SeqAIJ, 3525f4259b30SLisandro Dalcin NULL, 3526f4259b30SLisandro Dalcin /* 59*/ NULL, 3527b9b97703SBarry Smith MatDestroy_SeqAIJ, 3528b9b97703SBarry Smith MatView_SeqAIJ, 3529f4259b30SLisandro Dalcin NULL, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin /* 64*/ NULL, 3532321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin NULL, 3535f4259b30SLisandro Dalcin NULL, 3536d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3537c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3538f4259b30SLisandro Dalcin NULL, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin /* 74*/ NULL, 35423acb8795SBarry Smith MatFDColoringApply_AIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 35466ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3547f4259b30SLisandro Dalcin NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550bc011b1eSHong Zhang MatLoad_SeqAIJ, 3551d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35521cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin /* 89*/ NULL, 3557f4259b30SLisandro Dalcin NULL, 355826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 35618fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 35646fc122caSHong Zhang 
MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3565f4259b30SLisandro Dalcin NULL, 35664222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 356987d4246cSBarry Smith MatConjugate_SeqAIJ, 3570f4259b30SLisandro Dalcin NULL, 3571d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 357299cafbc1SBarry Smith MatRealPart_SeqAIJ, 3573f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 3576cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3577f4259b30SLisandro Dalcin NULL, 35782af78befSBarry Smith MatGetRowMin_SeqAIJ, 3579f4259b30SLisandro Dalcin NULL, 3580599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3581f4259b30SLisandro Dalcin /*114*/ NULL, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 3584f4259b30SLisandro Dalcin NULL, 3585f4259b30SLisandro Dalcin NULL, 3586f4259b30SLisandro Dalcin /*119*/ NULL, 3587f4259b30SLisandro Dalcin NULL, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35910716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3592a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 359337868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35940da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin /*129*/ NULL, 3597f4259b30SLisandro Dalcin NULL, 3598f4259b30SLisandro Dalcin NULL, 359975648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3600b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3601b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36022b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 36053964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3606f4259b30SLisandro Dalcin /*139*/ NULL, 3607f4259b30SLisandro Dalcin NULL, 3608f4259b30SLisandro Dalcin 
NULL, 36093a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36109c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36114222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36124222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3613f4259b30SLisandro Dalcin NULL, 361472833a62Smarkadams4 NULL, 361572833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36162d776b49SBarry Smith NULL, 3617dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3618dec0b466SHong Zhang MatEliminateZeros_SeqAIJ}; 361917ab2063SBarry Smith 3620d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3621d71ae5a4SJacob Faibussowitsch { 3622bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 362397f1f81fSBarry Smith PetscInt i, nz, n; 3624bef8e0ddSBarry Smith 3625bef8e0ddSBarry Smith PetscFunctionBegin; 3626bef8e0ddSBarry Smith nz = aij->maxnz; 3627d0f46423SBarry Smith n = mat->rmap->n; 3628ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3629bef8e0ddSBarry Smith aij->nz = nz; 3630ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 3631bef8e0ddSBarry Smith PetscFunctionReturn(0); 3632bef8e0ddSBarry Smith } 3633bef8e0ddSBarry Smith 3634a3bb6f32SFande Kong /* 3635ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3636ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3637ddea5d60SJunchao Zhang */ 3638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3639d71ae5a4SJacob Faibussowitsch { 3640a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3641eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3642eec179cfSJacob Faibussowitsch PetscHashIter tpos; 364325b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 364425b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3645a3bb6f32SFande Kong 3646a3bb6f32SFande Kong PetscFunctionBegin; 3647a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3648a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3649a3bb6f32SFande Kong /* use a table */ 3650eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3651a3bb6f32SFande Kong ec = 0; 365225b670f0SStefano Zampini for (i = 0; i < nz; i++) { 365325b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3654eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3655a3bb6f32SFande Kong if (!data) { 3656a3bb6f32SFande Kong /* one based table */ 3657c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3658a3bb6f32SFande Kong } 3659a3bb6f32SFande Kong } 3660a3bb6f32SFande Kong /* form array of columns we need */ 36619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3662eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3663eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3664eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3665eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3666eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3667a3bb6f32SFande Kong gid--; 3668a3bb6f32SFande 
Kong lid--; 3669a3bb6f32SFande Kong garray[lid] = gid; 3670a3bb6f32SFande Kong } 36719566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3672eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3673c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3674a3bb6f32SFande Kong /* compact out the extra columns in B */ 367525b670f0SStefano Zampini for (i = 0; i < nz; i++) { 367625b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3677eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3678a3bb6f32SFande Kong lid--; 367925b670f0SStefano Zampini jj[i] = lid; 3680a3bb6f32SFande Kong } 36819566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3682eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36839566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36849566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36859566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3686a3bb6f32SFande Kong PetscFunctionReturn(0); 3687a3bb6f32SFande Kong } 3688a3bb6f32SFande Kong 3689bef8e0ddSBarry Smith /*@ 3690bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3691bef8e0ddSBarry Smith in the matrix. 
3692bef8e0ddSBarry Smith 3693bef8e0ddSBarry Smith Input Parameters: 369411a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3695bef8e0ddSBarry Smith - indices - the column indices 3696bef8e0ddSBarry Smith 369715091d37SBarry Smith Level: advanced 369815091d37SBarry Smith 3699bef8e0ddSBarry Smith Notes: 3700bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3701bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 370211a5261eSBarry Smith of the `MatSetValues()` operation. 3703bef8e0ddSBarry Smith 3704bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 370511a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3706bef8e0ddSBarry Smith 370711a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3708bef8e0ddSBarry Smith 3709b9617806SBarry Smith The indices should start with zero, not one. 3710b9617806SBarry Smith 3711bef8e0ddSBarry Smith @*/ 3712d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3713d71ae5a4SJacob Faibussowitsch { 3714bef8e0ddSBarry Smith PetscFunctionBegin; 37150700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3716dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3717cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3718bef8e0ddSBarry Smith PetscFunctionReturn(0); 3719bef8e0ddSBarry Smith } 3720bef8e0ddSBarry Smith 3721be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3722be6bf707SBarry Smith 3723d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3724d71ae5a4SJacob Faibussowitsch { 3725be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3726d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3727be6bf707SBarry Smith 3728be6bf707SBarry Smith 
PetscFunctionBegin; 372928b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3730be6bf707SBarry Smith 3731be6bf707SBarry Smith /* allocate space for values if not already there */ 37324dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3733be6bf707SBarry Smith 3734be6bf707SBarry Smith /* copy values over */ 37359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 3736be6bf707SBarry Smith PetscFunctionReturn(0); 3737be6bf707SBarry Smith } 3738be6bf707SBarry Smith 3739be6bf707SBarry Smith /*@ 3740be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3741be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3742be6bf707SBarry Smith nonlinear portion. 3743be6bf707SBarry Smith 3744c3339decSBarry Smith Logically Collect 3745be6bf707SBarry Smith 3746be6bf707SBarry Smith Input Parameters: 374711a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3748be6bf707SBarry Smith 374915091d37SBarry Smith Level: advanced 375015091d37SBarry Smith 375111a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3752be6bf707SBarry Smith $ Create Jacobian matrix 3753be6bf707SBarry Smith $ Set linear terms into matrix 3754be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3755be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying 3756be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure) 3757512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3758be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3759be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3760be6bf707SBarry Smith $ In your Jacobian routine 3761be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3762be6bf707SBarry Smith $ Set nonlinear terms in matrix 3763be6bf707SBarry Smith 3764be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3765be6bf707SBarry Smith $ // build linear portion of Jacobian 3766512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3767be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3768be6bf707SBarry Smith $ loop over nonlinear iterations 3769be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3770be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 3771be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3772be6bf707SBarry Smith $ Solve linear system with Jacobian 3773be6bf707SBarry Smith $ endloop 3774be6bf707SBarry Smith 3775be6bf707SBarry Smith Notes: 3776be6bf707SBarry Smith Matrix must already be assembled before calling this routine 377711a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3778be6bf707SBarry Smith calling this routine. 3779be6bf707SBarry Smith 37800c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37810c468ba9SBarry Smith and does not allocate additional space.
37820c468ba9SBarry Smith 3783db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3784be6bf707SBarry Smith @*/ 3785d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3786d71ae5a4SJacob Faibussowitsch { 3787be6bf707SBarry Smith PetscFunctionBegin; 37880700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 378928b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 379028b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3791cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3792be6bf707SBarry Smith PetscFunctionReturn(0); 3793be6bf707SBarry Smith } 3794be6bf707SBarry Smith 3795d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3796d71ae5a4SJacob Faibussowitsch { 3797be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3798d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3799be6bf707SBarry Smith 3800be6bf707SBarry Smith PetscFunctionBegin; 380128b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 380228b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3803be6bf707SBarry Smith /* copy values over */ 38049566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3805be6bf707SBarry Smith PetscFunctionReturn(0); 3806be6bf707SBarry Smith } 3807be6bf707SBarry Smith 3808be6bf707SBarry Smith /*@ 3809be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3810be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3811be6bf707SBarry Smith nonlinear portion. 
3812be6bf707SBarry Smith 3813c3339decSBarry Smith Logically Collect 3814be6bf707SBarry Smith 3815be6bf707SBarry Smith Input Parameters: 381611a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3817be6bf707SBarry Smith 381815091d37SBarry Smith Level: advanced 381915091d37SBarry Smith 3820db781477SPatrick Sanan .seealso: `MatStoreValues()` 3821be6bf707SBarry Smith @*/ 3822d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3823d71ae5a4SJacob Faibussowitsch { 3824be6bf707SBarry Smith PetscFunctionBegin; 38250700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 382628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 382728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3828cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 3829be6bf707SBarry Smith PetscFunctionReturn(0); 3830be6bf707SBarry Smith } 3831be6bf707SBarry Smith 3832be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 383317ab2063SBarry Smith /*@C 383411a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38350d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38366e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 383751c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38382bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 383917ab2063SBarry Smith 3840d083f849SBarry Smith Collective 3841db81eaa0SLois Curfman McInnes 384217ab2063SBarry Smith Input Parameters: 384311a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 384417ab2063SBarry Smith . 
m - number of rows 384517ab2063SBarry Smith . n - number of columns 384617ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 384751c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38480298fd71SBarry Smith (possibly different for each row) or NULL 384917ab2063SBarry Smith 385017ab2063SBarry Smith Output Parameter: 3851416022c9SBarry Smith . A - the matrix 385217ab2063SBarry Smith 385311a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3854f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 385511a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3856175b88e8SBarry Smith 3857b259b22eSLois Curfman McInnes Notes: 385849a6f317SBarry Smith If nnz is given then nz is ignored 385949a6f317SBarry Smith 386011a5261eSBarry Smith The AIJ format, also called 386111a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38620002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 386344cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 386417ab2063SBarry Smith 386517ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 386611a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38673d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38686da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 386917ab2063SBarry Smith 3870682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38714fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3872682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38736c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38746c7ebb05SLois Curfman McInnes 38756c7ebb05SLois Curfman McInnes Options Database Keys: 3876698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38779db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 387817ab2063SBarry Smith 3879027ccd11SLois Curfman McInnes Level: intermediate 3880027ccd11SLois Curfman McInnes 388160161072SBarry Smith .seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 388217ab2063SBarry Smith @*/ 3883d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3884d71ae5a4SJacob Faibussowitsch { 38853a40ed3dSBarry Smith PetscFunctionBegin; 38869566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38879566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38889566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 3890273d9f13SBarry Smith PetscFunctionReturn(0); 3891273d9f13SBarry Smith } 3892273d9f13SBarry Smith 3893273d9f13SBarry Smith /*@C 3894273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3895273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3896273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3897273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 
3898273d9f13SBarry Smith 3899d083f849SBarry Smith Collective 3900273d9f13SBarry Smith 3901273d9f13SBarry Smith Input Parameters: 39021c4f3114SJed Brown + B - The matrix 3903273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3904273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39050298fd71SBarry Smith (possibly different for each row) or NULL 3906273d9f13SBarry Smith 3907273d9f13SBarry Smith Notes: 390849a6f317SBarry Smith If nnz is given then nz is ignored 390949a6f317SBarry Smith 391011a5261eSBarry Smith The `MATSEQAIJ` format also called 391111a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 3912273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3913273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3914273d9f13SBarry Smith 3915273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 391611a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 3917273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3918273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3919273d9f13SBarry Smith 392011a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3921aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3922aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3923aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3924aa95bbe8SBarry Smith 392511a5261eSBarry Smith Developer Notes: 392611a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3927a96a251dSBarry Smith entries or columns indices 3928a96a251dSBarry Smith 3929273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3930273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3931273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3932273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3933273d9f13SBarry Smith 3934273d9f13SBarry Smith Options Database Keys: 3935698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 393647b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3937273d9f13SBarry Smith 3938273d9f13SBarry Smith Level: intermediate 3939273d9f13SBarry Smith 3940db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3941db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3942273d9f13SBarry Smith @*/ 3943d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3944d71ae5a4SJacob Faibussowitsch { 3945a23d5eceSKris Buschelman PetscFunctionBegin; 39466ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39476ba663aaSJed Brown PetscValidType(B, 1); 3948cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3949a23d5eceSKris Buschelman PetscFunctionReturn(0); 3950a23d5eceSKris Buschelman } 3951a23d5eceSKris Buschelman 3952d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3953d71ae5a4SJacob Faibussowitsch { 3954273d9f13SBarry Smith Mat_SeqAIJ *b; 39552576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 395697f1f81fSBarry Smith PetscInt i; 3957273d9f13SBarry Smith 3958273d9f13SBarry Smith PetscFunctionBegin; 39592576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3960a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3961c461c341SBarry Smith skipallocation = PETSC_TRUE; 3962c461c341SBarry Smith nz = 0; 3963c461c341SBarry Smith } 39649566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39659566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3966899cda47SBarry Smith 3967435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 396808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3969cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3970d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 397108401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 397208401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3973b73539f3SBarry Smith } 3974b73539f3SBarry Smith } 3975b73539f3SBarry Smith 3976273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39772205254eSKarl Rupp 3978273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3979273d9f13SBarry Smith 3980ab93d7beSBarry Smith if (!skipallocation) { 39814dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3982071fcb05SBarry Smith if (!b->ilen) { 3983071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39849566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3985071fcb05SBarry Smith } else { 39869566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39872ee49352SLisandro Dalcin } 39884dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3989273d9f13SBarry Smith if (!nnz) { 3990435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3991c62bd62aSJed Brown else if (nz < 0) nz = 1; 39925d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3993d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3994d0f46423SBarry Smith nz = nz * B->rmap->n; 3995273d9f13SBarry Smith } else { 3996c73702f5SBarry Smith PetscInt64 nz64 = 0; 39979371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39989371c9d4SSatish Balay b->imax[i] = nnz[i]; 39999371c9d4SSatish Balay nz64 += nnz[i]; 40009371c9d4SSatish Balay } 40019566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4002273d9f13SBarry Smith } 4003ab93d7beSBarry Smith 4004273d9f13SBarry Smith /* allocate the matrix space */ 400553dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40069566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4007396832f4SHong Zhang if (B->structure_only) { 40089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4010396832f4SHong Zhang } else { 40119566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4012396832f4SHong Zhang } 4013bfeeae90SHong Zhang b->i[0] = 0; 4014ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4015396832f4SHong Zhang if (B->structure_only) { 4016396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4017396832f4SHong Zhang b->free_a = PETSC_FALSE; 4018396832f4SHong Zhang } else { 4019273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4020e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4021396832f4SHong Zhang } 4022e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4023c461c341SBarry Smith } else { 4024e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4025e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4026c461c341SBarry Smith } 4027273d9f13SBarry Smith 4028846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4029846b4da1SFande Kong /* reserve user-requested sparsity */ 40309566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4031846b4da1SFande Kong } 4032846b4da1SFande Kong 4033273d9f13SBarry Smith b->nz = 0; 4034273d9f13SBarry Smith b->maxnz = nz; 4035273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40361baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4037cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4038cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40395519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40405519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40415519a089SJose E. Roman */ 40425519a089SJose E. Roman B->nonzerostate++; 4043273d9f13SBarry Smith PetscFunctionReturn(0); 4044273d9f13SBarry Smith } 4045273d9f13SBarry Smith 4046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4047d71ae5a4SJacob Faibussowitsch { 4048846b4da1SFande Kong Mat_SeqAIJ *a; 4049a5bbaf83SFande Kong PetscInt i; 4050846b4da1SFande Kong 4051846b4da1SFande Kong PetscFunctionBegin; 4052846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405314d0e64fSAlex Lindsay 405414d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 405514d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 405614d0e64fSAlex Lindsay 4057846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40582c814fdeSFande Kong /* if no saved info, we error out */ 405928b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40602c814fdeSFande Kong 4061aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40622c814fdeSFande Kong 40639566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40649566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4065846b4da1SFande Kong a->i[0] = 0; 4066ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4067846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4068846b4da1SFande Kong a->nz = 0; 4069846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4070846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4071846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4072846b4da1SFande Kong A->assembled = PETSC_FALSE; 4073846b4da1SFande Kong PetscFunctionReturn(0); 4074846b4da1SFande Kong } 4075846b4da1SFande Kong 407658d36128SBarry Smith /*@ 407711a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
sparse sequential matrix in `MATSEQAIJ` format. 4078a1661176SMatthew Knepley 4079a1661176SMatthew Knepley Input Parameters: 4080a1661176SMatthew Knepley + B - the matrix 4081a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4082a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4083a1661176SMatthew Knepley - v - optional values in the matrix 4084a1661176SMatthew Knepley 4085a1661176SMatthew Knepley Level: developer 4086a1661176SMatthew Knepley 40876a9b8d82SBarry Smith Notes: 408811a5261eSBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 408958d36128SBarry Smith 40906a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40916a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40926a9b8d82SBarry Smith 40936a9b8d82SBarry Smith Developer Notes: 40946a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 409511a5261eSBarry Smith then just copies the v values directly with `PetscMemcpy()`. 40966a9b8d82SBarry Smith 409711a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
40986a9b8d82SBarry Smith 4099db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4100a1661176SMatthew Knepley @*/ 4101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4102d71ae5a4SJacob Faibussowitsch { 4103a1661176SMatthew Knepley PetscFunctionBegin; 41040700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41056ba663aaSJed Brown PetscValidType(B, 1); 4106cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4107a1661176SMatthew Knepley PetscFunctionReturn(0); 4108a1661176SMatthew Knepley } 4109a1661176SMatthew Knepley 4110d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4111d71ae5a4SJacob Faibussowitsch { 4112a1661176SMatthew Knepley PetscInt i; 4113a1661176SMatthew Knepley PetscInt m, n; 4114a1661176SMatthew Knepley PetscInt nz; 41156a9b8d82SBarry Smith PetscInt *nnz; 4116a1661176SMatthew Knepley 4117a1661176SMatthew Knepley PetscFunctionBegin; 4118aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4119779a8d59SSatish Balay 41209566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41219566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4122779a8d59SSatish Balay 41239566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4125a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4126b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 412708401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4128a1661176SMatthew Knepley nnz[i] = nz; 4129a1661176SMatthew Knepley } 41309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41319566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4132a1661176SMatthew Knepley 413348a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4134a1661176SMatthew Knepley 41359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4137a1661176SMatthew Knepley 41389566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4139a1661176SMatthew Knepley PetscFunctionReturn(0); 4140a1661176SMatthew Knepley } 4141a1661176SMatthew Knepley 4142ad7e164aSPierre Jolivet /*@ 4143ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4144ad7e164aSPierre Jolivet 4145ad7e164aSPierre Jolivet Input Parameters: 4146ad7e164aSPierre Jolivet + A - left-hand side matrix 4147ad7e164aSPierre Jolivet . B - right-hand side matrix 414811a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4149ad7e164aSPierre Jolivet 4150ad7e164aSPierre Jolivet Output Parameter: 4151ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4152ad7e164aSPierre Jolivet 4153ad7e164aSPierre Jolivet Level: intermediate 4154ad7e164aSPierre Jolivet 415511a5261eSBarry Smith Note: 415611a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4157ad7e164aSPierre Jolivet 4158db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4159ad7e164aSPierre Jolivet @*/ 4160d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4161d71ae5a4SJacob Faibussowitsch { 4162ad7e164aSPierre Jolivet PetscFunctionBegin; 4163ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4164ad7e164aSPierre Jolivet PetscValidType(A, 1); 4165ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4166ad7e164aSPierre Jolivet PetscValidType(B, 2); 4167ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4168ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4169ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4170ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4171ad7e164aSPierre Jolivet } 4172cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4173ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4174ad7e164aSPierre Jolivet } 4175ad7e164aSPierre Jolivet 4176d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4177d71ae5a4SJacob Faibussowitsch { 4178ad7e164aSPierre Jolivet Mat newmat; 4179ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4180ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4181ad7e164aSPierre Jolivet PetscScalar *v; 4182fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4183ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4184ad7e164aSPierre Jolivet PetscBool flg; 4185ad7e164aSPierre Jolivet 4186ad7e164aSPierre Jolivet PetscFunctionBegin; 418728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418828b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 418928b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419028b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41919566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 419228b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4193aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4194ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41959566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41969566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41979566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41989566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4199ad7e164aSPierre Jolivet i[0] = 0; 4200ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4201ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4202ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4203ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4204ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4205ad7e164aSPierre Jolivet } 4206ad7e164aSPierre Jolivet } 4207ad7e164aSPierre Jolivet } 42089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4209ad7e164aSPierre Jolivet *C = newmat; 42109566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4211ad7e164aSPierre Jolivet nnz = 0; 4212ad7e164aSPierre Jolivet } 42139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 42149566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4216ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4217ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4218ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4219ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4220ad7e164aSPierre Jolivet } 4221ad7e164aSPierre Jolivet } 4222ad7e164aSPierre Jolivet } 42239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4226ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4227ad7e164aSPierre Jolivet } 4228ad7e164aSPierre Jolivet 4229c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4230af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4231170fe5c8SBarry Smith 4232170fe5c8SBarry Smith /* 4233170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4234170fe5c8SBarry Smith 4235170fe5c8SBarry Smith n p p 42362da392ccSBarry Smith [ ] [ ] [ ] 42372da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42382da392ccSBarry Smith [ ] [ ] [ ] 4239170fe5c8SBarry Smith 4240170fe5c8SBarry Smith */ 4241d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4242d71ae5a4SJacob Faibussowitsch { 4243170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4244170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4245170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 424686214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4247170fe5c8SBarry Smith const PetscInt *ii, *idx; 4248170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4249170fe5c8SBarry Smith PetscScalar *c, *c_q; 425086214ceeSStefano Zampini PetscInt clda = sub_c->lda; 425186214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4252170fe5c8SBarry Smith 4253170fe5c8SBarry Smith PetscFunctionBegin; 4254d0f46423SBarry Smith m = A->rmap->n; 4255d0f46423SBarry Smith n = A->cmap->n; 4256d0f46423SBarry Smith p = B->cmap->n; 4257170fe5c8SBarry Smith a = sub_a->v; 4258170fe5c8SBarry Smith b = sub_b->a; 4259170fe5c8SBarry Smith c = sub_c->v; 426086214ceeSStefano Zampini if (clda == m) { 42619566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 426286214ceeSStefano Zampini } else { 426386214ceeSStefano Zampini for (j = 0; j < p; j++) 42649371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 426586214ceeSStefano Zampini } 4266170fe5c8SBarry Smith ii = sub_b->i; 4267170fe5c8SBarry Smith idx = sub_b->j; 4268170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4269170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4270170fe5c8SBarry Smith while (q-- > 0) { 427186214ceeSStefano Zampini c_q = c + clda * (*idx); 427286214ceeSStefano Zampini a_q = a + alda * i; 4273854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4274170fe5c8SBarry Smith idx++; 4275170fe5c8SBarry Smith b++; 4276170fe5c8SBarry Smith } 4277170fe5c8SBarry Smith } 4278170fe5c8SBarry Smith PetscFunctionReturn(0); 4279170fe5c8SBarry Smith } 4280170fe5c8SBarry Smith 4281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4282d71ae5a4SJacob Faibussowitsch { 4283d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 428486214ceeSStefano Zampini PetscBool cisdense; 4285170fe5c8SBarry Smith 4286170fe5c8SBarry Smith PetscFunctionBegin; 428708401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42889566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42899566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 4290d5e393b6SSuyash Tandon 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 429148a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42929566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4293d73949e8SHong Zhang 42944222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4295170fe5c8SBarry Smith PetscFunctionReturn(0); 4296170fe5c8SBarry Smith } 4297170fe5c8SBarry Smith 4298170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42990bad9183SKris Buschelman /*MC 4300fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43010bad9183SKris Buschelman based on compressed sparse row format. 43020bad9183SKris Buschelman 43030bad9183SKris Buschelman Options Database Keys: 43040bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43050bad9183SKris Buschelman 43060bad9183SKris Buschelman Level: beginner 43070bad9183SKris Buschelman 43080cd7f59aSBarry Smith Notes: 430911a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 43100cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43110cd7f59aSBarry Smith in the matrix 43120cd7f59aSBarry Smith 431311a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
    In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
  `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
  for communicators controlling multiple processes.  It is recommended that you call both of
  the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

  Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
   enough exist.

  Level: beginner

.seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
   and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`

  Level: beginner

.seealso: `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
M*/

/* Forward declarations of conversion and product-setup routines; their definitions are not in this part of the file */
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
#if defined(PETSC_HAVE_ELEMENTAL)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_SCALAPACK)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HYPRE)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
#endif

PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);

/*@C
   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored

   Not Collective

   Input Parameter:
.  A - a `MATSEQAIJ` matrix

   Output Parameter:
.
array - pointer to the data 43858c778c55SBarry Smith 43868c778c55SBarry Smith Level: intermediate 43878c778c55SBarry Smith 4388*0ab4885dSBarry Smith Fortran Note: 4389*0ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 4390*0ab4885dSBarry Smith 4391db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43928c778c55SBarry Smith @*/ 4393d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4394d71ae5a4SJacob Faibussowitsch { 4395d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43968c778c55SBarry Smith 43978c778c55SBarry Smith PetscFunctionBegin; 4398d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43999566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4400d67d9f35SJunchao Zhang } else { 4401d67d9f35SJunchao Zhang *array = aij->a; 4402d67d9f35SJunchao Zhang } 4403d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4404d67d9f35SJunchao Zhang } 4405d67d9f35SJunchao Zhang 4406d67d9f35SJunchao Zhang /*@C 440711a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4408d67d9f35SJunchao Zhang 4409d67d9f35SJunchao Zhang Not Collective 4410d67d9f35SJunchao Zhang 4411d67d9f35SJunchao Zhang Input Parameters: 441211a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4413d67d9f35SJunchao Zhang - array - pointer to the data 4414d67d9f35SJunchao Zhang 4415d67d9f35SJunchao Zhang Level: intermediate 4416d67d9f35SJunchao Zhang 4417*0ab4885dSBarry Smith Fortran Note: 4418*0ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 4419*0ab4885dSBarry Smith 4420db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4421d67d9f35SJunchao Zhang @*/ 4422d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, 
PetscScalar **array) 4423d71ae5a4SJacob Faibussowitsch { 4424d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4425d67d9f35SJunchao Zhang 4426d67d9f35SJunchao Zhang PetscFunctionBegin; 4427d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44289566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4429d67d9f35SJunchao Zhang } else { 4430d67d9f35SJunchao Zhang *array = NULL; 4431d67d9f35SJunchao Zhang } 44329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44339566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44348c778c55SBarry Smith PetscFunctionReturn(0); 44358c778c55SBarry Smith } 44368c778c55SBarry Smith 443721e72a00SBarry Smith /*@C 443811a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44398f1ea47aSStefano Zampini 4440*0ab4885dSBarry Smith Not Collective; No Fortran Support 44418f1ea47aSStefano Zampini 44428f1ea47aSStefano Zampini Input Parameter: 444311a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44448f1ea47aSStefano Zampini 44458f1ea47aSStefano Zampini Output Parameter: 44468f1ea47aSStefano Zampini . 
array - pointer to the data 44478f1ea47aSStefano Zampini 44488f1ea47aSStefano Zampini Level: intermediate 44498f1ea47aSStefano Zampini 4450db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44518f1ea47aSStefano Zampini @*/ 4452d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4453d71ae5a4SJacob Faibussowitsch { 4454d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44558f1ea47aSStefano Zampini 44568f1ea47aSStefano Zampini PetscFunctionBegin; 4457d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44589566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4459d67d9f35SJunchao Zhang } else { 4460d67d9f35SJunchao Zhang *array = aij->a; 4461d67d9f35SJunchao Zhang } 44628f1ea47aSStefano Zampini PetscFunctionReturn(0); 44638f1ea47aSStefano Zampini } 44648f1ea47aSStefano Zampini 44658f1ea47aSStefano Zampini /*@C 446611a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44678f1ea47aSStefano Zampini 4468*0ab4885dSBarry Smith Not Collective; No Fortran Support 44698f1ea47aSStefano Zampini 44708f1ea47aSStefano Zampini Input Parameter: 447111a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44728f1ea47aSStefano Zampini 44738f1ea47aSStefano Zampini Output Parameter: 44748f1ea47aSStefano Zampini . 
array - pointer to the data 44758f1ea47aSStefano Zampini 44768f1ea47aSStefano Zampini Level: intermediate 44778f1ea47aSStefano Zampini 4478db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44798f1ea47aSStefano Zampini @*/ 4480d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4481d71ae5a4SJacob Faibussowitsch { 4482d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44838f1ea47aSStefano Zampini 44848f1ea47aSStefano Zampini PetscFunctionBegin; 4485d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44869566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4487d67d9f35SJunchao Zhang } else { 4488d67d9f35SJunchao Zhang *array = NULL; 4489d67d9f35SJunchao Zhang } 4490d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4491d67d9f35SJunchao Zhang } 4492d67d9f35SJunchao Zhang 4493d67d9f35SJunchao Zhang /*@C 449411a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4495d67d9f35SJunchao Zhang 4496*0ab4885dSBarry Smith Not Collective; No Fortran Support 4497d67d9f35SJunchao Zhang 4498d67d9f35SJunchao Zhang Input Parameter: 449911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4500d67d9f35SJunchao Zhang 4501d67d9f35SJunchao Zhang Output Parameter: 4502d67d9f35SJunchao Zhang . 
array - pointer to the data 4503d67d9f35SJunchao Zhang 4504d67d9f35SJunchao Zhang Level: intermediate 4505d67d9f35SJunchao Zhang 4506db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4507d67d9f35SJunchao Zhang @*/ 4508d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4509d71ae5a4SJacob Faibussowitsch { 4510d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4511d67d9f35SJunchao Zhang 4512d67d9f35SJunchao Zhang PetscFunctionBegin; 4513d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45149566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4515d67d9f35SJunchao Zhang } else { 4516d67d9f35SJunchao Zhang *array = aij->a; 4517d67d9f35SJunchao Zhang } 45189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45199566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4520d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4521d67d9f35SJunchao Zhang } 4522d67d9f35SJunchao Zhang 4523d67d9f35SJunchao Zhang /*@C 4524d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4525d67d9f35SJunchao Zhang 4526*0ab4885dSBarry Smith Not Collective; No Fortran Support 4527d67d9f35SJunchao Zhang 4528d67d9f35SJunchao Zhang Input Parameter: 4529d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4530d67d9f35SJunchao Zhang 4531d67d9f35SJunchao Zhang Output Parameter: 4532d67d9f35SJunchao Zhang . 
array - pointer to the data 4533d67d9f35SJunchao Zhang 4534d67d9f35SJunchao Zhang Level: intermediate 4535d67d9f35SJunchao Zhang 4536db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4537d67d9f35SJunchao Zhang @*/ 4538d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4539d71ae5a4SJacob Faibussowitsch { 4540d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4541d67d9f35SJunchao Zhang 4542d67d9f35SJunchao Zhang PetscFunctionBegin; 4543d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45449566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4545d67d9f35SJunchao Zhang } else { 4546d67d9f35SJunchao Zhang *array = NULL; 4547d67d9f35SJunchao Zhang } 45488f1ea47aSStefano Zampini PetscFunctionReturn(0); 45498f1ea47aSStefano Zampini } 45508f1ea47aSStefano Zampini 45518f1ea47aSStefano Zampini /*@C 455211a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45537ee59b9bSJunchao Zhang 4554*0ab4885dSBarry Smith Not Collective; No Fortran Support 45557ee59b9bSJunchao Zhang 45567ee59b9bSJunchao Zhang Input Parameter: 455711a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45587ee59b9bSJunchao Zhang 45597ee59b9bSJunchao Zhang Output Parameters: 45607ee59b9bSJunchao Zhang + i - row map array of the matrix 45617ee59b9bSJunchao Zhang . j - column index array of the matrix 45627ee59b9bSJunchao Zhang . a - data array of the matrix 45637ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45647ee59b9bSJunchao Zhang 45657ee59b9bSJunchao Zhang Notes: 45667ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45677ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45687ee59b9bSJunchao Zhang 45697ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45707ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45717ee59b9bSJunchao Zhang 45727ee59b9bSJunchao Zhang Level: Developer 45737ee59b9bSJunchao Zhang 4574db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45757ee59b9bSJunchao Zhang @*/ 4576d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4577d71ae5a4SJacob Faibussowitsch { 45787ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45797ee59b9bSJunchao Zhang 45807ee59b9bSJunchao Zhang PetscFunctionBegin; 45817ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45827ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45837ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45847ee59b9bSJunchao Zhang } else { 45857ee59b9bSJunchao Zhang if (i) *i = aij->i; 45867ee59b9bSJunchao Zhang if (j) *j = aij->j; 45877ee59b9bSJunchao Zhang if (a) *a = aij->a; 45887ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45897ee59b9bSJunchao Zhang } 45907ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45917ee59b9bSJunchao Zhang } 45927ee59b9bSJunchao Zhang 45937ee59b9bSJunchao Zhang /*@C 459421e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 459521e72a00SBarry Smith 459621e72a00SBarry Smith Not Collective 459721e72a00SBarry Smith 459821e72a00SBarry Smith Input Parameter: 459911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 460021e72a00SBarry Smith 460121e72a00SBarry Smith Output Parameter: 460221e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 460321e72a00SBarry Smith 460421e72a00SBarry Smith Level: intermediate 460521e72a00SBarry Smith 4606db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 460721e72a00SBarry Smith @*/ 4608d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4609d71ae5a4SJacob Faibussowitsch { 461021e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 461121e72a00SBarry Smith 461221e72a00SBarry Smith PetscFunctionBegin; 461321e72a00SBarry Smith *nz = aij->rmax; 461421e72a00SBarry Smith PetscFunctionReturn(0); 461521e72a00SBarry Smith } 461621e72a00SBarry Smith 4617d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4618d71ae5a4SJacob Faibussowitsch { 4619394ed5ebSJunchao Zhang MPI_Comm comm; 4620394ed5ebSJunchao Zhang PetscInt *i, *j; 4621394ed5ebSJunchao Zhang PetscInt M, N, row; 4622394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4623394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4624394ed5ebSJunchao Zhang PetscInt *Aj; 4625394ed5ebSJunchao Zhang PetscScalar *Aa; 4626cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4627cbc6b225SStefano Zampini MatType rtype; 4628394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4629394ed5ebSJunchao Zhang 4630394ed5ebSJunchao Zhang PetscFunctionBegin; 46319566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46329566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46339566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4634e8729f6fSJunchao Zhang i = coo_i; 4635e8729f6fSJunchao Zhang j = coo_j; 46369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4637394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4638394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4639394ed5ebSJunchao Zhang perm[k] = k; 4640394ed5ebSJunchao Zhang } 4641394ed5ebSJunchao Zhang 4642394ed5ebSJunchao Zhang /* Sort by row */ 46439566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46449371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46459371c9d4SSatish Balay if (i[k] >= 0) break; 46469371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4647394ed5ebSJunchao Zhang nneg = k; 46489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4649394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4650394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4651394ed5ebSJunchao Zhang 46529566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4654394ed5ebSJunchao Zhang 4655394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4656394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4657394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4658394ed5ebSJunchao Zhang while (k < coo_n) { 4659394ed5ebSJunchao Zhang row = i[k]; 4660394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4661394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4662394ed5ebSJunchao Zhang end = k; 46639566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4664394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4665394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4666394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4667394ed5ebSJunchao Zhang Ai[row] = 1; 4668394ed5ebSJunchao Zhang nnz++; 4669394ed5ebSJunchao Zhang 4670394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4671394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4672394ed5ebSJunchao Zhang q++; 4673394ed5ebSJunchao Zhang jmap[q] = 1; 4674394ed5ebSJunchao Zhang Aj[q] = j[p]; 4675394ed5ebSJunchao Zhang Ai[row]++; 4676394ed5ebSJunchao Zhang nnz++; 4677394ed5ebSJunchao Zhang } else { 4678394ed5ebSJunchao Zhang jmap[q]++; 4679394ed5ebSJunchao Zhang } 4680394ed5ebSJunchao Zhang } 4681394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4682394ed5ebSJunchao Zhang } 4683394ed5ebSJunchao Zhang 4684394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4685394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4686394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4687394ed5ebSJunchao Zhang jmap[0] = 0; 4688394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4689394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4690394ed5ebSJunchao Zhang PetscCount *jmap_new; 4691394ed5ebSJunchao Zhang PetscInt *Aj_new; 4692394ed5ebSJunchao Zhang 46939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46949566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46959566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4696394ed5ebSJunchao Zhang jmap = jmap_new; 4697394ed5ebSJunchao Zhang 46989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47009566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4701394ed5ebSJunchao Zhang Aj = Aj_new; 4702394ed5ebSJunchao Zhang } 4703394ed5ebSJunchao Zhang 
4704394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4705394ed5ebSJunchao Zhang PetscCount *perm_new; 4706cbc6b225SStefano Zampini 47079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 47089566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47099566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4710394ed5ebSJunchao Zhang perm = perm_new; 4711394ed5ebSJunchao Zhang } 4712394ed5ebSJunchao Zhang 47139566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47149566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 47159566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4716394ed5ebSJunchao Zhang 4717394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4718394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4719394ed5ebSJunchao Zhang /* Record COO fields */ 4720394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4721394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4722394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4723394ed5ebSJunchao Zhang seqaij->perm = perm; 4724394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4725394ed5ebSJunchao Zhang } 4726394ed5ebSJunchao Zhang 4727d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4728d71ae5a4SJacob Faibussowitsch { 4729394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4730394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4731394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4732394ed5ebSJunchao Zhang PetscScalar *Aa; 
4733394ed5ebSJunchao Zhang 4734394ed5ebSJunchao Zhang PetscFunctionBegin; 47359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4736394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4737b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4738b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4739b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4740394ed5ebSJunchao Zhang } 47419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4742394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4743394ed5ebSJunchao Zhang } 4744394ed5ebSJunchao Zhang 474534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47465063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 474702fe1965SBarry Smith #endif 4748d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4749d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4750d5e393b6SSuyash Tandon #endif 47513d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47525063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47533d0639e7SStefano Zampini #endif 475402fe1965SBarry Smith 4755d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4756d71ae5a4SJacob Faibussowitsch { 4757273d9f13SBarry Smith Mat_SeqAIJ *b; 475838baddfdSBarry Smith PetscMPIInt size; 4759273d9f13SBarry Smith 4760273d9f13SBarry Smith PetscFunctionBegin; 47619566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 476208401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4763273d9f13SBarry Smith 47644dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47652205254eSKarl Rupp 4766b0a32e0cSBarry Smith B->data = (void *)b; 47672205254eSKarl Rupp 47689566063dSJacob 
Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4769071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47702205254eSKarl Rupp 4771f4259b30SLisandro Dalcin b->row = NULL; 4772f4259b30SLisandro Dalcin b->col = NULL; 4773f4259b30SLisandro Dalcin b->icol = NULL; 4774b810aeb4SBarry Smith b->reallocs = 0; 477536db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4776f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4777416022c9SBarry Smith b->nonew = 0; 4778f4259b30SLisandro Dalcin b->diag = NULL; 4779f4259b30SLisandro Dalcin b->solve_work = NULL; 4780f4259b30SLisandro Dalcin B->spptr = NULL; 4781f4259b30SLisandro Dalcin b->saved_values = NULL; 4782f4259b30SLisandro Dalcin b->idiag = NULL; 4783f4259b30SLisandro Dalcin b->mdiag = NULL; 4784f4259b30SLisandro Dalcin b->ssor_work = NULL; 478571f1c65dSBarry Smith b->omega = 1.0; 478671f1c65dSBarry Smith b->fshift = 0.0; 478771f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4788bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4789a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 479017ab2063SBarry Smith 47919566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4792d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 47949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4795b3866ffcSBarry Smith #endif 47969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 47979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 47989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, 
"MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 47999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 48009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 48019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 48029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 48039779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4805191b95cbSRichard Tran Mills #endif 480634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 481002fe1965SBarry Smith #endif 4811d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4812d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4813d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4814d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, 
"MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4815d5e393b6SSuyash Tandon #endif 48163d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 48183d0639e7SStefano Zampini #endif 48199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4820af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4822af8000cdSHong Zhang #endif 4823d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48249566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4825d24d4204SJose E. 
Roman #endif 482663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48289566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 482963c07aadSStefano Zampini #endif 48309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 48349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 48359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 48379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48409566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48459566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48469566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 48479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48483a40ed3dSBarry Smith PetscFunctionReturn(0); 484917ab2063SBarry Smith } 485017ab2063SBarry Smith 4851b24902e0SBarry Smith /* 48523893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4853b24902e0SBarry Smith */ 4854d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4855d71ae5a4SJacob Faibussowitsch { 48562a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4857071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 485817ab2063SBarry Smith 48593a40ed3dSBarry Smith PetscFunctionBegin; 4860aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4861273d9f13SBarry Smith 4862d5f3da31SBarry Smith C->factortype = A->factortype; 4863f4259b30SLisandro Dalcin c->row = 
NULL; 4864f4259b30SLisandro Dalcin c->col = NULL; 4865f4259b30SLisandro Dalcin c->icol = NULL; 48666ad4291fSHong Zhang c->reallocs = 0; 486717ab2063SBarry Smith 486869272f91SPierre Jolivet C->assembled = A->assembled; 486969272f91SPierre Jolivet C->preallocated = A->preallocated; 487017ab2063SBarry Smith 487169272f91SPierre Jolivet if (A->preallocated) { 48729566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48739566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4874eec197d1SBarry Smith 48759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48769566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48789566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 487917ab2063SBarry Smith 488017ab2063SBarry Smith /* allocate the matrix space */ 4881f77e22a1SHong Zhang if (mallocmatspace) { 48829566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48832205254eSKarl Rupp 4884f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48852205254eSKarl Rupp 48869566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 488717ab2063SBarry Smith if (m > 0) { 48889566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4889be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48902e5835c6SStefano Zampini const PetscScalar *aa; 48912e5835c6SStefano Zampini 48929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48939566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4895be6bf707SBarry Smith } else { 48969566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 489717ab2063SBarry Smith } 489808480c60SBarry Smith } 4899f77e22a1SHong Zhang } 
490017ab2063SBarry Smith 49016ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4902416022c9SBarry Smith c->roworiented = a->roworiented; 4903416022c9SBarry Smith c->nonew = a->nonew; 4904416022c9SBarry Smith if (a->diag) { 49059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 49069566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4907071fcb05SBarry Smith } else c->diag = NULL; 49082205254eSKarl Rupp 4909f4259b30SLisandro Dalcin c->solve_work = NULL; 4910f4259b30SLisandro Dalcin c->saved_values = NULL; 4911f4259b30SLisandro Dalcin c->idiag = NULL; 4912f4259b30SLisandro Dalcin c->ssor_work = NULL; 4913a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4914e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4915e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49166ad4291fSHong Zhang 4917893ad86cSHong Zhang c->rmax = a->rmax; 4918416022c9SBarry Smith c->nz = a->nz; 49198ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4920754ec7b1SSatish Balay 49216ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49226ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4923cd6b891eSBarry Smith if (a->compressedrow.use) { 49246ad4291fSHong Zhang i = a->compressedrow.nrows; 49259566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49269566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 492827ea64f8SHong Zhang } else { 492927ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49300298fd71SBarry Smith c->compressedrow.i = NULL; 49310298fd71SBarry Smith c->compressedrow.rindex = NULL; 49326ad4291fSHong Zhang } 4933ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4934e56f5c9eSBarry Smith C->nonzerostate 
= A->nonzerostate; 49354846f1f5SKris Buschelman 49369566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 493769272f91SPierre Jolivet } 49389566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49393a40ed3dSBarry Smith PetscFunctionReturn(0); 494017ab2063SBarry Smith } 494117ab2063SBarry Smith 4942d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4943d71ae5a4SJacob Faibussowitsch { 4944b24902e0SBarry Smith PetscFunctionBegin; 49459566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49469566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 494748a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49489566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49499566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4950b24902e0SBarry Smith PetscFunctionReturn(0); 4951b24902e0SBarry Smith } 4952b24902e0SBarry Smith 4953d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4954d71ae5a4SJacob Faibussowitsch { 495552f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 495652f91c60SVaclav Hapla 495752f91c60SVaclav Hapla PetscFunctionBegin; 495852f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 495952f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4960c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49619566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 49629566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49639566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 496452f91c60SVaclav Hapla if (isbinary) { 49659566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 496652f91c60SVaclav Hapla } else if (ishdf5) { 496752f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49689566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 496952f91c60SVaclav Hapla #else 497052f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 497152f91c60SVaclav Hapla #endif 497252f91c60SVaclav Hapla } else { 497398921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 497452f91c60SVaclav Hapla } 497552f91c60SVaclav Hapla PetscFunctionReturn(0); 497652f91c60SVaclav Hapla } 497752f91c60SVaclav Hapla 4978d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4979d71ae5a4SJacob Faibussowitsch { 49803ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49813ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4982fbdbba38SShri Abhyankar 4983fbdbba38SShri Abhyankar PetscFunctionBegin; 49849566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4985bbead8a2SBarry Smith 49863ea6fe3dSLisandro Dalcin /* read in matrix header */ 49879566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 498808401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49899371c9d4SSatish Balay M = header[1]; 49909371c9d4SSatish Balay N = header[2]; 49919371c9d4SSatish Balay nz = header[3]; 499208401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), 
PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 499308401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 499408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4995fbdbba38SShri Abhyankar 49963ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49979566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49983ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49993ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50003ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50013ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50023ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50039566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50049566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50053ea6fe3dSLisandro Dalcin 50063ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50079566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5008aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50093ea6fe3dSLisandro Dalcin 5010fbdbba38SShri Abhyankar /* read in row lengths */ 50119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 50129566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 50133ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50149371c9d4SSatish Balay sum = 0; 50159371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 
501608401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50173ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50199566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5020aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50213ea6fe3dSLisandro Dalcin /* store row lengths */ 50229566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50239566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5024fbdbba38SShri Abhyankar 50253ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50269371c9d4SSatish Balay a->i[0] = 0; 50279371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50283ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50299566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50303ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50319566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5032fbdbba38SShri Abhyankar 50339566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50349566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 5035fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5036fbdbba38SShri Abhyankar } 5037fbdbba38SShri Abhyankar 5038d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5039d71ae5a4SJacob Faibussowitsch { 50407264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 
5041fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5042eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5043eeffb40dSHong Zhang PetscInt k; 5044eeffb40dSHong Zhang #endif 50457264ac53SSatish Balay 50463a40ed3dSBarry Smith PetscFunctionBegin; 5047bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5048d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5049ca44d042SBarry Smith *flg = PETSC_FALSE; 5050ca44d042SBarry Smith PetscFunctionReturn(0); 5051bcd2baecSBarry Smith } 50527264ac53SSatish Balay 50537264ac53SSatish Balay /* if the a->i are the same */ 50549566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5055abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50567264ac53SSatish Balay 50577264ac53SSatish Balay /* if a->j are the same */ 50589566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5059abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5060bcd2baecSBarry Smith 50619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5063bcd2baecSBarry Smith /* if a->a are the same */ 5064eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5065eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5066fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5067eeffb40dSHong Zhang *flg = PETSC_FALSE; 50683a40ed3dSBarry Smith PetscFunctionReturn(0); 5069eeffb40dSHong Zhang } 5070eeffb40dSHong Zhang } 5071eeffb40dSHong Zhang #else 50729566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5073eeffb40dSHong Zhang #endif 50749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5076eeffb40dSHong Zhang PetscFunctionReturn(0); 
50777264ac53SSatish Balay } 507836db0b34SBarry Smith 507905869f15SSatish Balay /*@ 508011a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 508136db0b34SBarry Smith provided by the user. 508236db0b34SBarry Smith 5083d083f849SBarry Smith Collective 508436db0b34SBarry Smith 508536db0b34SBarry Smith Input Parameters: 508636db0b34SBarry Smith + comm - must be an MPI communicator of size 1 508736db0b34SBarry Smith . m - number of rows 508836db0b34SBarry Smith . n - number of columns 5089483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 509036db0b34SBarry Smith . j - column indices 509136db0b34SBarry Smith - a - matrix values 509236db0b34SBarry Smith 509336db0b34SBarry Smith Output Parameter: 509436db0b34SBarry Smith . mat - the matrix 509536db0b34SBarry Smith 509636db0b34SBarry Smith Level: intermediate 509736db0b34SBarry Smith 509836db0b34SBarry Smith Notes: 50990551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5100292fb18eSBarry Smith once the matrix is destroyed and not before 510136db0b34SBarry Smith 510236db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 510336db0b34SBarry Smith 5104bfeeae90SHong Zhang The i and j indices are 0 based 510536db0b34SBarry Smith 5106a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5107a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 51088eef79e4SBarry Smith as shown 5109a4552177SSatish Balay 51108eef79e4SBarry Smith $ 1 0 0 51118eef79e4SBarry Smith $ 2 0 3 51128eef79e4SBarry Smith $ 4 5 6 51138eef79e4SBarry Smith $ 51148eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 51158eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51168eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5117a4552177SSatish Balay 5118db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 511936db0b34SBarry Smith @*/ 5120d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5121d71ae5a4SJacob Faibussowitsch { 5122cbcfb4deSHong Zhang PetscInt ii; 512336db0b34SBarry Smith Mat_SeqAIJ *aij; 5124cbcfb4deSHong Zhang PetscInt jj; 512536db0b34SBarry Smith 512636db0b34SBarry Smith PetscFunctionBegin; 5127aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51289566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51309566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51319566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5133ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5136ab93d7beSBarry Smith 513736db0b34SBarry Smith aij->i = i; 513836db0b34SBarry Smith aij->j = j; 513936db0b34SBarry Smith aij->a = a; 514036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
514136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5142e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5143e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 514436db0b34SBarry Smith 5145cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 514636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 514776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5148aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51499985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 515008401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 515108401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51529985e31cSBarry Smith } 515336db0b34SBarry Smith } 515476bd3646SJed Brown } 515576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 515636db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 515708401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5158aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 515936db0b34SBarry Smith } 516076bd3646SJed Brown } 516136db0b34SBarry Smith 51629566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51639566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 516436db0b34SBarry Smith PetscFunctionReturn(0); 516536db0b34SBarry Smith } 5166cbc6b225SStefano Zampini 5167f62e3866SBarry Smith /*@ 516811a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51698a0b0e6bSVictor Minden provided by the user. 51708a0b0e6bSVictor Minden 5171d083f849SBarry Smith Collective 51728a0b0e6bSVictor Minden 51738a0b0e6bSVictor Minden Input Parameters: 51748a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51758a0b0e6bSVictor Minden . m - number of rows 51768a0b0e6bSVictor Minden . n - number of columns 51778a0b0e6bSVictor Minden . i - row indices 51788a0b0e6bSVictor Minden . j - column indices 51791230e6d1SVictor Minden . a - matrix values 51801230e6d1SVictor Minden . nz - number of nonzeros 518111a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51828a0b0e6bSVictor Minden 51838a0b0e6bSVictor Minden Output Parameter: 51848a0b0e6bSVictor Minden . 
mat - the matrix 51858a0b0e6bSVictor Minden 51868a0b0e6bSVictor Minden Level: intermediate 51878a0b0e6bSVictor Minden 5188f62e3866SBarry Smith Example: 5189f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51909e99939fSJunchao Zhang .vb 51918a0b0e6bSVictor Minden 1 0 0 51928a0b0e6bSVictor Minden 2 0 3 51938a0b0e6bSVictor Minden 4 5 6 51948a0b0e6bSVictor Minden 51958a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51968a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51978a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51989e99939fSJunchao Zhang .ve 5199d7547e51SJunchao Zhang Notes: 5200d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5201d7547e51SJunchao Zhang and are particularly useful in iterative applications. 52028a0b0e6bSVictor Minden 5203d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 52048a0b0e6bSVictor Minden @*/ 5205d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5206d71ae5a4SJacob Faibussowitsch { 5207d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 52088a0b0e6bSVictor Minden 52098a0b0e6bSVictor Minden PetscFunctionBegin; 52109566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5211ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 52129566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52139566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52149566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 52161230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 52171230e6d1SVictor Minden if (idx) { 52181230e6d1SVictor Minden row = i[ii] - 1; 52191230e6d1SVictor Minden col = j[ii] - 1; 52201230e6d1SVictor Minden } else { 52211230e6d1SVictor Minden row = i[ii]; 52221230e6d1SVictor Minden col = j[ii]; 52238a0b0e6bSVictor Minden } 52249566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52258a0b0e6bSVictor Minden } 52269566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52279566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52289566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52298a0b0e6bSVictor Minden PetscFunctionReturn(0); 52308a0b0e6bSVictor Minden } 523136db0b34SBarry Smith 5232d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5233d71ae5a4SJacob Faibussowitsch { 5234acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5235acf2f550SJed Brown 5236acf2f550SJed Brown PetscFunctionBegin; 5237acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5238acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52392205254eSKarl Rupp 52409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5241acf2f550SJed Brown PetscFunctionReturn(0); 5242acf2f550SJed Brown } 5243acf2f550SJed Brown 5244d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5245d71ae5a4SJacob Faibussowitsch { 52469c8f2541SHong Zhang PetscFunctionBegin; 52479566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52489c8f2541SHong Zhang PetscFunctionReturn(0); 52499c8f2541SHong Zhang } 52509c8f2541SHong Zhang 525181824310SBarry Smith /* 525253dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
525353dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 525453dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 525553dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 525653dd7562SDmitry Karpeev */ 5257d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5258d71ae5a4SJacob Faibussowitsch { 525953dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 526053dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 526153dd7562SDmitry Karpeev PetscBool seqaij; 526253dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 526353dd7562SDmitry Karpeev PetscScalar v; 526453dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 526553dd7562SDmitry Karpeev 526653dd7562SDmitry Karpeev PetscFunctionBegin; 526753dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 526853dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52699566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 527028b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 527153dd7562SDmitry Karpeev if (rowemb) { 52729566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 527308401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 527453dd7562SDmitry Karpeev } else { 527508401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 527653dd7562SDmitry Karpeev } 527753dd7562SDmitry Karpeev if (colemb) { 52789566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 527908401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 528053dd7562SDmitry Karpeev } else { 528108401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 528253dd7562SDmitry Karpeev } 528353dd7562SDmitry Karpeev 528453dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 528553dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5287ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52899566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 529053dd7562SDmitry Karpeev } 529148a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 529253dd7562SDmitry Karpeev count = 0; 529353dd7562SDmitry Karpeev rowindices = NULL; 
529453dd7562SDmitry Karpeev colindices = NULL; 529548a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 529648a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 529753dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 529853dd7562SDmitry Karpeev PetscInt row; 529953dd7562SDmitry Karpeev row = i; 530053dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 530153dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 530253dd7562SDmitry Karpeev PetscInt col; 530353dd7562SDmitry Karpeev col = Baij->j[count]; 530453dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 530553dd7562SDmitry Karpeev v = Baij->a[count]; 53069566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 530753dd7562SDmitry Karpeev ++count; 530853dd7562SDmitry Karpeev } 530953dd7562SDmitry Karpeev } 531053dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 531153dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 531253dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 531353dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 531453dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 531553dd7562SDmitry Karpeev PetscFunctionReturn(0); 531653dd7562SDmitry Karpeev } 531753dd7562SDmitry Karpeev 5318dec0b466SHong Zhang PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A) 5319dec0b466SHong Zhang { 5320dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5321dec0b466SHong Zhang MatScalar *aa = a->a; 5322dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5323dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5324dec0b466SHong Zhang 5325dec0b466SHong Zhang PetscFunctionBegin; 5326dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5327dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5328dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5329dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5330dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 5331dec0b466SHong Zhang if (aa[k] == 0 && aj[k] != i - 1) fshift++; 5332dec0b466SHong Zhang else { 5333dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5334dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5335dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5336dec0b466SHong Zhang } 5337dec0b466SHong Zhang } 5338dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5339dec0b466SHong Zhang fshift_prev = fshift; 5340dec0b466SHong Zhang /* reset ilen and imax for each row */ 5341dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5342dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 5343dec0b466SHong 
Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5344dec0b466SHong Zhang } 5345dec0b466SHong Zhang if (m) { 5346dec0b466SHong Zhang ai[m] -= fshift; 5347dec0b466SHong Zhang a->nz = ai[m]; 5348dec0b466SHong Zhang } 5349dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5350dec0b466SHong Zhang A->nonzerostate -= fshift; 5351dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5352dec0b466SHong Zhang a->rmax = rmax; 5353dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5354dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5355dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5356dec0b466SHong Zhang PetscFunctionReturn(0); 5357dec0b466SHong Zhang } 5358dec0b466SHong Zhang 53594099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53604099cc6bSBarry Smith 53614099cc6bSBarry Smith /*@C 536211a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53634099cc6bSBarry Smith 5364c3339decSBarry Smith Collective 53654099cc6bSBarry Smith 53664099cc6bSBarry Smith Input Parameters: 53674099cc6bSBarry Smith + mat - the matrix object 53684099cc6bSBarry Smith - matype - matrix type 53694099cc6bSBarry Smith 53704099cc6bSBarry Smith Options Database Key: 53714099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 53724099cc6bSBarry Smith 53734099cc6bSBarry Smith Level: intermediate 53744099cc6bSBarry Smith 5375db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53764099cc6bSBarry Smith @*/ 5377d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5378d71ae5a4SJacob Faibussowitsch { 53794099cc6bSBarry Smith PetscBool sametype; 53805f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53814099cc6bSBarry Smith 53824099cc6bSBarry Smith PetscFunctionBegin; 53834099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53854099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53864099cc6bSBarry Smith 53879566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53885f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53899566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53904099cc6bSBarry Smith PetscFunctionReturn(0); 53914099cc6bSBarry Smith } 53924099cc6bSBarry Smith 53934099cc6bSBarry Smith /*@C 539411a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53954099cc6bSBarry Smith 53964099cc6bSBarry Smith Not Collective 53974099cc6bSBarry Smith 53984099cc6bSBarry Smith Input Parameters: 539911a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 54004099cc6bSBarry Smith - function - routine to convert to subtype 54014099cc6bSBarry Smith 54024099cc6bSBarry Smith Notes: 540311a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
54044099cc6bSBarry Smith 54054099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54064099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54074099cc6bSBarry Smith 54084099cc6bSBarry Smith Level: advanced 54094099cc6bSBarry Smith 5410db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 54114099cc6bSBarry Smith @*/ 5412d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5413d71ae5a4SJacob Faibussowitsch { 54144099cc6bSBarry Smith PetscFunctionBegin; 54159566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54169566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 54174099cc6bSBarry Smith PetscFunctionReturn(0); 54184099cc6bSBarry Smith } 54194099cc6bSBarry Smith 54204099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54214099cc6bSBarry Smith 54224099cc6bSBarry Smith /*@C 542311a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 54244099cc6bSBarry Smith 54254099cc6bSBarry Smith Not Collective 54264099cc6bSBarry Smith 54274099cc6bSBarry Smith Level: advanced 54284099cc6bSBarry Smith 5429db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 54304099cc6bSBarry Smith @*/ 5431d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5432d71ae5a4SJacob Faibussowitsch { 54334099cc6bSBarry Smith PetscFunctionBegin; 54344099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 54354099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54364099cc6bSBarry Smith 54379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 54389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 54409779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5442485f9817SRichard Tran Mills #endif 54435063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54455063d097SStefano Zampini #endif 5446d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5447d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5448d5e393b6SSuyash Tandon #endif 54495063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54515063d097SStefano Zampini #endif 54524099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54544099cc6bSBarry Smith #endif 54554099cc6bSBarry Smith PetscFunctionReturn(0); 54564099cc6bSBarry Smith } 545753dd7562SDmitry Karpeev 545853dd7562SDmitry Karpeev /* 545981824310SBarry Smith Special version for direct calls from Fortran 546081824310SBarry Smith */ 5461af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 546281824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 546381824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 546481824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 546581824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 546681824310SBarry Smith #endif 546781824310SBarry Smith 546881824310SBarry Smith /* Change these macros so can be used in void function */ 546998921bdaSJacob Faibussowitsch 547098921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54719566063dSJacob Faibussowitsch /* 
Identical to PetscCallVoid, except it assigns to *_ierr */ 54729566063dSJacob Faibussowitsch #undef PetscCall 54739371c9d4SSatish Balay #define PetscCall(...) \ 54749371c9d4SSatish Balay do { \ 54755f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 547698921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 547798921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 547898921bdaSJacob Faibussowitsch return; \ 547998921bdaSJacob Faibussowitsch } \ 548098921bdaSJacob Faibussowitsch } while (0) 548198921bdaSJacob Faibussowitsch 548298921bdaSJacob Faibussowitsch #undef SETERRQ 54839371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54849371c9d4SSatish Balay do { \ 548598921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 548698921bdaSJacob Faibussowitsch return; \ 548798921bdaSJacob Faibussowitsch } while (0) 548881824310SBarry Smith 5489d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5490d71ae5a4SJacob Faibussowitsch { 549181824310SBarry Smith Mat A = *AA; 549281824310SBarry Smith PetscInt m = *mm, n = *nn; 549381824310SBarry Smith InsertMode is = *isis; 549481824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 549581824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 549681824310SBarry Smith PetscInt *imax, *ai, *ailen; 549781824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 549854f21887SBarry Smith MatScalar *ap, value, *aa; 5499ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5500ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 550181824310SBarry Smith 550281824310SBarry Smith 
PetscFunctionBegin; 55034994cf47SJed Brown MatCheckPreallocated(A, 1); 550481824310SBarry Smith imax = a->imax; 550581824310SBarry Smith ai = a->i; 550681824310SBarry Smith ailen = a->ilen; 550781824310SBarry Smith aj = a->j; 550881824310SBarry Smith aa = a->a; 550981824310SBarry Smith 551081824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 551181824310SBarry Smith row = im[k]; 551281824310SBarry Smith if (row < 0) continue; 55135f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 55149371c9d4SSatish Balay rp = aj + ai[row]; 55159371c9d4SSatish Balay ap = aa + ai[row]; 55169371c9d4SSatish Balay rmax = imax[row]; 55179371c9d4SSatish Balay nrow = ailen[row]; 551881824310SBarry Smith low = 0; 551981824310SBarry Smith high = nrow; 552081824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 552181824310SBarry Smith if (in[l] < 0) continue; 55225f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 552381824310SBarry Smith col = in[l]; 55242205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 55252205254eSKarl Rupp else value = v[k + l * m]; 55262205254eSKarl Rupp 552781824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 552881824310SBarry Smith 55292205254eSKarl Rupp if (col <= lastcol) low = 0; 55302205254eSKarl Rupp else high = nrow; 553181824310SBarry Smith lastcol = col; 553281824310SBarry Smith while (high - low > 5) { 553381824310SBarry Smith t = (low + high) / 2; 553481824310SBarry Smith if (rp[t] > col) high = t; 553581824310SBarry Smith else low = t; 553681824310SBarry Smith } 553781824310SBarry Smith for (i = low; i < high; i++) { 553881824310SBarry Smith if (rp[i] > col) break; 553981824310SBarry Smith if (rp[i] == col) { 554081824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 554181824310SBarry Smith 
else ap[i] = value; 554281824310SBarry Smith goto noinsert; 554381824310SBarry Smith } 554481824310SBarry Smith } 554581824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 554681824310SBarry Smith if (nonew == 1) goto noinsert; 55475f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5548fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 55499371c9d4SSatish Balay N = nrow++ - 1; 55509371c9d4SSatish Balay a->nz++; 55519371c9d4SSatish Balay high++; 555281824310SBarry Smith /* shift up all the later entries in this row */ 555381824310SBarry Smith for (ii = N; ii >= i; ii--) { 555481824310SBarry Smith rp[ii + 1] = rp[ii]; 555581824310SBarry Smith ap[ii + 1] = ap[ii]; 555681824310SBarry Smith } 555781824310SBarry Smith rp[i] = col; 555881824310SBarry Smith ap[i] = value; 5559e56f5c9eSBarry Smith A->nonzerostate++; 556081824310SBarry Smith noinsert:; 556181824310SBarry Smith low = i + 1; 556281824310SBarry Smith } 556381824310SBarry Smith ailen[row] = nrow; 556481824310SBarry Smith } 556581824310SBarry Smith PetscFunctionReturnVoid(); 556681824310SBarry Smith } 556798921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 556898921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 556998921bdaSJacob Faibussowitsch * original definitions */ 55709566063dSJacob Faibussowitsch #undef PetscCall 557198921bdaSJacob Faibussowitsch #undef SETERRQ 5572