1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 597fff043a9SJunchao Zhang MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 6009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 6369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, 
rowlens, m, PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 112317ab2063SBarry Smith /* reset ilen and imax for each row */ 11247b083b7cSBarry Smith a->nonzerorowcnt = 0; 1125396832f4SHong Zhang if (A->structure_only) { 11269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1128396832f4SHong Zhang } else { /* !A->structure_only */ 112917ab2063SBarry Smith for (i = 0; i < m; i++) { 113017ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11317b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113217ab2063SBarry Smith } 1133396832f4SHong Zhang } 1134bfeeae90SHong Zhang a->nz = ai[m]; 1135aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused 
space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113617ab2063SBarry Smith 11379566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11389566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11412205254eSKarl Rupp 11428e58a170SBarry Smith A->info.mallocs += a->reallocs; 1143dd5f02e7SSatish Balay a->reallocs = 0; 11446712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114536db0b34SBarry Smith a->rmax = rmax; 11464e220ebcSLois Curfman McInnes 114748a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11489566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11493a40ed3dSBarry Smith PetscFunctionReturn(0); 115017ab2063SBarry Smith } 115117ab2063SBarry Smith 1152d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1153d71ae5a4SJacob Faibussowitsch { 115499cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115599cafbc1SBarry Smith PetscInt i, nz = a->nz; 11562e5835c6SStefano Zampini MatScalar *aa; 115799cafbc1SBarry Smith 115899cafbc1SBarry Smith PetscFunctionBegin; 11599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116399cafbc1SBarry Smith PetscFunctionReturn(0); 116499cafbc1SBarry Smith } 
116599cafbc1SBarry Smith 1166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1167d71ae5a4SJacob Faibussowitsch { 116899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116999cafbc1SBarry Smith PetscInt i, nz = a->nz; 11702e5835c6SStefano Zampini MatScalar *aa; 117199cafbc1SBarry Smith 117299cafbc1SBarry Smith PetscFunctionBegin; 11739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117799cafbc1SBarry Smith PetscFunctionReturn(0); 117899cafbc1SBarry Smith } 117999cafbc1SBarry Smith 1180d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1181d71ae5a4SJacob Faibussowitsch { 1182fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1183fff043a9SJunchao Zhang MatScalar *aa; 11843a40ed3dSBarry Smith 11853a40ed3dSBarry Smith PetscFunctionBegin; 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11879566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11903a40ed3dSBarry Smith PetscFunctionReturn(0); 119117ab2063SBarry Smith } 1192416022c9SBarry Smith 1193d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1194d71ae5a4SJacob Faibussowitsch { 1195cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1196cbc6b225SStefano Zampini 1197cbc6b225SStefano Zampini PetscFunctionBegin; 11989566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1200cbc6b225SStefano Zampini PetscFunctionReturn(0); 1201cbc6b225SStefano Zampini } 
1202cbc6b225SStefano Zampini 1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1204d71ae5a4SJacob Faibussowitsch { 1205416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1206d5d45c9bSBarry Smith 12073a40ed3dSBarry Smith PetscFunctionBegin; 1208aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1209c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121017ab2063SBarry Smith #endif 12119566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12129566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12139566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12159566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12259566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1227901853e0SKris Buschelman 12286718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12296718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12306718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12316718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12326718818eSStefano Zampini due to different matrix sizes */ 12339566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12346718818eSStefano Zampini 12359566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12362e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12452e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12462e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12472e956fe4SStefano Zampini #endif 12484222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12524222ddf1SHong Zhang #endif 12533d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12553d0639e7SStefano Zampini #endif 12569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1257af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1259af8000cdSHong Zhang #endif 1260d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1262d24d4204SJose E. 
Roman #endif 126363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 126663c07aadSStefano Zampini #endif 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12712e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12822e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12832e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12893a40ed3dSBarry Smith PetscFunctionReturn(0); 129017ab2063SBarry Smith } 129117ab2063SBarry Smith 1292d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1293d71ae5a4SJacob Faibussowitsch { 1294416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 12953a40ed3dSBarry Smith 12963a40ed3dSBarry Smith PetscFunctionBegin; 1297a65d3064SKris Buschelman switch (op) { 1298d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1299d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1300d71ae5a4SJacob Faibussowitsch break; 1301d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1302d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1303d71ae5a4SJacob Faibussowitsch break; 1304d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1305d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1306d71ae5a4SJacob Faibussowitsch break; 1307d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1308d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1309d71ae5a4SJacob Faibussowitsch break; 1310d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1311d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1312d71ae5a4SJacob Faibussowitsch break; 1313d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1314d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1315d71ae5a4SJacob Faibussowitsch break; 1316d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1317d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1318d71ae5a4SJacob Faibussowitsch break; 13193d472b54SHong Zhang case MAT_SPD: 1320b1646e73SJed Brown case MAT_SYMMETRIC: 1321b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1322b1646e73SJed Brown case MAT_HERMITIAN: 1323b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1324957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1325b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1326b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1327b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13285021d80fSJed Brown break; 13298c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1330a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1331d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1332d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1333d71ae5a4SJacob Faibussowitsch break; 1334d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1335d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1336d71ae5a4SJacob Faibussowitsch break; 1337d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1338d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1339d71ae5a4SJacob Faibussowitsch break; 1340071fcb05SBarry Smith case MAT_SORTED_FULL: 
1341071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1342071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1343071fcb05SBarry Smith break; 1344d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1345d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch default: 1348d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1349a65d3064SKris Buschelman } 13503a40ed3dSBarry Smith PetscFunctionReturn(0); 135117ab2063SBarry Smith } 135217ab2063SBarry Smith 1353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1354d71ae5a4SJacob Faibussowitsch { 1355416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1356fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1357c898d852SStefano Zampini PetscScalar *x; 1358c898d852SStefano Zampini const PetscScalar *aa; 135917ab2063SBarry Smith 13603a40ed3dSBarry Smith PetscFunctionBegin; 13619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1364d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1365d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13669566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13672c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13689566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137035e7444dSHong Zhang PetscFunctionReturn(0); 137135e7444dSHong Zhang } 137235e7444dSHong Zhang 13739566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137435e7444dSHong Zhang for (i = 0; i < n; i++) { 
1375fdc842d1SBarry Smith x[i] = 0.0; 137635e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 137735e7444dSHong Zhang if (aj[j] == i) { 137835e7444dSHong Zhang x[i] = aa[j]; 137917ab2063SBarry Smith break; 138017ab2063SBarry Smith } 138117ab2063SBarry Smith } 138217ab2063SBarry Smith } 13839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13853a40ed3dSBarry Smith PetscFunctionReturn(0); 138617ab2063SBarry Smith } 138717ab2063SBarry Smith 1388c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1389d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1390d71ae5a4SJacob Faibussowitsch { 1391416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13925f22a7b3SSebastian Grimberg const MatScalar *aa; 1393d9ca1df4SBarry Smith PetscScalar *y; 1394d9ca1df4SBarry Smith const PetscScalar *x; 1395d0f46423SBarry Smith PetscInt m = A->rmap->n; 13965c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 13975f22a7b3SSebastian Grimberg const MatScalar *v; 1398a77337e4SBarry Smith PetscScalar alpha; 1399d9ca1df4SBarry Smith PetscInt n, i, j; 1400d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14013447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1402ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14035c897100SBarry Smith #endif 140417ab2063SBarry Smith 14053a40ed3dSBarry Smith PetscFunctionBegin; 14069566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14079566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14089566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14105c897100SBarry Smith 14115c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1412fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14135c897100SBarry Smith #else 14143447b6efSHong Zhang if (usecprow) { 14153447b6efSHong Zhang m = cprow.nrows; 14163447b6efSHong Zhang ii = cprow.i; 14177b2bb3b9SHong Zhang ridx = cprow.rindex; 14183447b6efSHong Zhang } else { 14193447b6efSHong Zhang ii = a->i; 14203447b6efSHong Zhang } 142117ab2063SBarry Smith for (i = 0; i < m; i++) { 14223447b6efSHong Zhang idx = a->j + ii[i]; 1423fff043a9SJunchao Zhang v = aa + ii[i]; 14243447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14253447b6efSHong Zhang if (usecprow) { 14267b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14273447b6efSHong Zhang } else { 142817ab2063SBarry Smith alpha = x[i]; 14293447b6efSHong Zhang } 143004fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143117ab2063SBarry Smith } 14325c897100SBarry Smith #endif 14339566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14349566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14359566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14373a40ed3dSBarry Smith PetscFunctionReturn(0); 143817ab2063SBarry Smith } 143917ab2063SBarry Smith 1440d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1441d71ae5a4SJacob Faibussowitsch { 14425c897100SBarry Smith PetscFunctionBegin; 14439566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14449566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14455c897100SBarry Smith PetscFunctionReturn(0); 14465c897100SBarry Smith } 14475c897100SBarry Smith 1448c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 144978b84d54SShri Abhyankar 1450d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1451d71ae5a4SJacob Faibussowitsch { 1452416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1453d9fead3dSBarry Smith PetscScalar *y; 145454f21887SBarry Smith const 
PetscScalar *x; 1455fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1456003131ecSBarry Smith PetscInt m = A->rmap->n; 14570298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14587b083b7cSBarry Smith PetscInt n, i; 1459362ced78SSatish Balay PetscScalar sum; 1460ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146117ab2063SBarry Smith 1462b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146397952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1464fee21e36SBarry Smith #endif 1465fee21e36SBarry Smith 14663a40ed3dSBarry Smith PetscFunctionBegin; 1467b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14689566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1469b215bc84SStefano Zampini PetscFunctionReturn(0); 1470b215bc84SStefano Zampini } 14719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14729566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14739566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1474416022c9SBarry Smith ii = a->i; 14754eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14769566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 147797952fefSHong Zhang m = a->compressedrow.nrows; 147897952fefSHong Zhang ii = a->compressedrow.i; 147997952fefSHong Zhang ridx = a->compressedrow.rindex; 148097952fefSHong Zhang for (i = 0; i < m; i++) { 148197952fefSHong Zhang n = ii[i + 1] - ii[i]; 148297952fefSHong Zhang aj = a->j + ii[i]; 1483fff043a9SJunchao Zhang aa = a_a + ii[i]; 148497952fefSHong Zhang sum = 0.0; 1485003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1486003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 148797952fefSHong Zhang y[*ridx++] = sum; 148897952fefSHong Zhang } 148997952fefSHong Zhang } else { /* do not use compressed row format */ 1490b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14913d3eaba7SBarry Smith aj = a->j; 1492fff043a9SJunchao Zhang aa 
= a_a; 1493b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1494b05257ddSBarry Smith #else 149517ab2063SBarry Smith for (i = 0; i < m; i++) { 1496003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1497003131ecSBarry Smith aj = a->j + ii[i]; 1498fff043a9SJunchao Zhang aa = a_a + ii[i]; 149917ab2063SBarry Smith sum = 0.0; 1500003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150117ab2063SBarry Smith y[i] = sum; 150217ab2063SBarry Smith } 15038d195f9aSBarry Smith #endif 1504b05257ddSBarry Smith } 15059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15079566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15093a40ed3dSBarry Smith PetscFunctionReturn(0); 151017ab2063SBarry Smith } 151117ab2063SBarry Smith 1512d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1513d71ae5a4SJacob Faibussowitsch { 1514b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1515b434eb95SMatthew G. Knepley PetscScalar *y; 1516b434eb95SMatthew G. Knepley const PetscScalar *x; 1517fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1518b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1519b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1520b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1521b434eb95SMatthew G. Knepley PetscScalar sum; 1522b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1523b434eb95SMatthew G. Knepley 1524b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1525b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1526b434eb95SMatthew G. Knepley #endif 1527b434eb95SMatthew G. Knepley 1528b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15319566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1532b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1533b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1534b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1535b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1536b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1537b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1538b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1539fff043a9SJunchao Zhang aa = a_a + ii[i]; 1540b434eb95SMatthew G. Knepley sum = 0.0; 1541b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1542b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1543b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1544b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1545b434eb95SMatthew G. Knepley } 1546b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15473d3eaba7SBarry Smith ii = a->i; 1548b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1549b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1550b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1551fff043a9SJunchao Zhang aa = a_a + ii[i]; 1552b434eb95SMatthew G. Knepley sum = 0.0; 1553b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1554b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1555b434eb95SMatthew G. Knepley y[i] = sum; 1556b434eb95SMatthew G. Knepley } 1557b434eb95SMatthew G. Knepley } 15589566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15599566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15609566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1562b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1563b434eb95SMatthew G. Knepley } 1564b434eb95SMatthew G. Knepley 1565d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1566d71ae5a4SJacob Faibussowitsch { 1567b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1568b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1569b434eb95SMatthew G. Knepley const PetscScalar *x; 1570fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1571b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1572b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1573b434eb95SMatthew G. Knepley PetscScalar sum; 1574b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1575b434eb95SMatthew G. Knepley 1576b434eb95SMatthew G. Knepley PetscFunctionBegin; 15779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15789566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15799566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1580b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158148a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1582b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1583b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1584b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1585b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1586b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1587b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1588fff043a9SJunchao Zhang aa = a_a + ii[i]; 1589b434eb95SMatthew G. Knepley sum = y[*ridx]; 1590b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1591b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1592b434eb95SMatthew G. Knepley } 1593b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15943d3eaba7SBarry Smith ii = a->i; 1595b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1596b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1597b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1598fff043a9SJunchao Zhang aa = a_a + ii[i]; 1599b434eb95SMatthew G. Knepley sum = y[i]; 1600b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1601b434eb95SMatthew G. Knepley z[i] = sum; 1602b434eb95SMatthew G. Knepley } 1603b434eb95SMatthew G. Knepley } 16049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1608b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1609b434eb95SMatthew G. Knepley } 1610b434eb95SMatthew G. Knepley 1611c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1612d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1613d71ae5a4SJacob Faibussowitsch { 1614416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1615f15663dcSBarry Smith PetscScalar *y, *z; 1616f15663dcSBarry Smith const PetscScalar *x; 1617fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1618d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1619d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1620362ced78SSatish Balay PetscScalar sum; 1621ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16229ea0dfa2SSatish Balay 16233a40ed3dSBarry Smith PetscFunctionBegin; 1624b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16259566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1626b215bc84SStefano Zampini PetscFunctionReturn(0); 1627b215bc84SStefano Zampini } 16289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16299566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16309566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16314eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163397952fefSHong Zhang m = a->compressedrow.nrows; 163497952fefSHong Zhang ii = a->compressedrow.i; 163597952fefSHong Zhang ridx = a->compressedrow.rindex; 163697952fefSHong Zhang for (i = 0; i < m; i++) { 163797952fefSHong Zhang n = ii[i + 1] - ii[i]; 163897952fefSHong Zhang aj = a->j + ii[i]; 1639fff043a9SJunchao Zhang aa = a_a + ii[i]; 164097952fefSHong Zhang sum = y[*ridx]; 1641f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164297952fefSHong Zhang z[*ridx++] = sum; 164397952fefSHong Zhang } 164497952fefSHong Zhang } else { /* do not use compressed row format */ 16453d3eaba7SBarry Smith ii = a->i; 1646f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16473d3eaba7SBarry Smith aj = a->j; 1648fff043a9SJunchao Zhang aa = a_a; 1649f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1650f15663dcSBarry Smith #else 165117ab2063SBarry Smith for (i = 0; i < m; i++) { 1652f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1653f15663dcSBarry Smith aj = a->j + ii[i]; 1654fff043a9SJunchao Zhang aa = a_a + ii[i]; 165517ab2063SBarry Smith sum = y[i]; 1656f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165717ab2063SBarry Smith z[i] = sum; 165817ab2063SBarry Smith } 165902ab625aSSatish Balay #endif 1660f15663dcSBarry Smith } 16619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16629566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16653a40ed3dSBarry Smith PetscFunctionReturn(0); 166617ab2063SBarry Smith } 166717ab2063SBarry Smith 166817ab2063SBarry Smith /* 166917ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167017ab2063SBarry Smith */ 1671d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1672d71ae5a4SJacob Faibussowitsch { 1673416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1674d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1675c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 167617ab2063SBarry Smith 16773a40ed3dSBarry Smith PetscFunctionBegin; 167809f38230SBarry Smith if (!a->diag) { 16799566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1680c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168109f38230SBarry Smith } 1682d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1683c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1684c0c07093SJunchao Zhang if (alreadySet) { 1685c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1686c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1687c0c07093SJunchao Zhang } 1688c0c07093SJunchao Zhang 168909f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1690bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1691bfeeae90SHong Zhang if (a->j[j] == i) { 169209f38230SBarry Smith a->diag[i] = j; 169317ab2063SBarry Smith break; 169417ab2063SBarry Smith } 169517ab2063SBarry Smith } 169617ab2063SBarry Smith } 16973a40ed3dSBarry Smith PetscFunctionReturn(0); 169817ab2063SBarry Smith } 169917ab2063SBarry Smith 1700d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1701d71ae5a4SJacob Faibussowitsch { 170261ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170361ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170461ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 170561ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 170661ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 170761ecd0c6SBarry Smith 170861ecd0c6SBarry Smith PetscFunctionBegin; 
170961ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17119566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171261ecd0c6SBarry Smith PetscFunctionReturn(0); 171361ecd0c6SBarry Smith } 171461ecd0c6SBarry Smith 171561ecd0c6SBarry Smith if (a->diagonaldense) { 171661ecd0c6SBarry Smith cnt = 0; 171761ecd0c6SBarry Smith } else { 17189566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 171961ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1720349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172161ecd0c6SBarry Smith cnt++; 172261ecd0c6SBarry Smith mdiag[i] = 1; 172361ecd0c6SBarry Smith } 172461ecd0c6SBarry Smith } 172561ecd0c6SBarry Smith } 172661ecd0c6SBarry Smith if (!cnt) { 17279566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 172861ecd0c6SBarry Smith } else { 1729b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1730b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173161ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173261ecd0c6SBarry Smith 173361ecd0c6SBarry Smith a->a = NULL; 173461ecd0c6SBarry Smith a->j = NULL; 173561ecd0c6SBarry Smith a->i = NULL; 173661ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1737ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 173961ecd0c6SBarry Smith 174061ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174161ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17429566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174348a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1744447d62f5SStefano Zampini } 17459566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17469566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 174761ecd0c6SBarry Smith if (singlemalloc) { 17489566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 174961ecd0c6SBarry Smith } else { 17509566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17519566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17529566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175361ecd0c6SBarry Smith } 175461ecd0c6SBarry Smith } 17559566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 175661ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 175761ecd0c6SBarry Smith PetscFunctionReturn(0); 175861ecd0c6SBarry Smith } 175961ecd0c6SBarry Smith 1760be5855fcSBarry Smith /* 1761be5855fcSBarry Smith Checks for missing diagonals 1762be5855fcSBarry Smith */ 1763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1764d71ae5a4SJacob Faibussowitsch { 1765be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17667734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1767be5855fcSBarry Smith 1768be5855fcSBarry Smith PetscFunctionBegin; 176909f38230SBarry Smith *missing = PETSC_FALSE; 17707734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177109f38230SBarry Smith *missing = PETSC_TRUE; 177209f38230SBarry Smith if (d) *d = 0; 17739566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177409f38230SBarry Smith } else { 177501445905SHong Zhang PetscInt n; 177601445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1777f1e2ffcdSBarry Smith diag = a->diag; 177801445905SHong Zhang for (i = 0; i < n; i++) { 17797734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178009f38230SBarry Smith *missing = PETSC_TRUE; 178109f38230SBarry Smith if (d) *d = i; 17829566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1783358d2f5dSShri Abhyankar break; 178409f38230SBarry Smith } 1785be5855fcSBarry Smith } 1786be5855fcSBarry Smith } 1787be5855fcSBarry Smith PetscFunctionReturn(0); 1788be5855fcSBarry Smith } 1789be5855fcSBarry Smith 17900da83c2eSBarry Smith #include <petscblaslapack.h> 17910da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17920da83c2eSBarry Smith 17930da83c2eSBarry Smith /* 17940da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17950da83c2eSBarry Smith */ 1796d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1797d71ae5a4SJacob Faibussowitsch { 17980da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 17990da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18000da83c2eSBarry Smith const PetscReal shift = 0.0; 18010da83c2eSBarry Smith PetscInt ipvt[5]; 18020da83c2eSBarry Smith PetscScalar work[25], *v_work; 18030da83c2eSBarry Smith 18040da83c2eSBarry Smith PetscFunctionBegin; 18050da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18060da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += 
bsizes[i]; 180708401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1808ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181048a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18110da83c2eSBarry Smith ncnt = 0; 18120da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18130da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18149566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18150da83c2eSBarry Smith switch (bsizes[i]) { 1816d71ae5a4SJacob Faibussowitsch case 1: 1817d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1818d71ae5a4SJacob Faibussowitsch break; 18190da83c2eSBarry Smith case 2: 18209566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18210da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18229566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18230da83c2eSBarry Smith break; 18240da83c2eSBarry Smith case 3: 18259566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18260da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18280da83c2eSBarry Smith break; 18290da83c2eSBarry Smith case 4: 18309566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18310da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18329566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18330da83c2eSBarry Smith break; 18340da83c2eSBarry Smith case 5: 18359566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18360da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18380da83c2eSBarry Smith break; 18390da83c2eSBarry Smith case 6: 18409566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18410da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18430da83c2eSBarry Smith break; 18440da83c2eSBarry Smith case 7: 18459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18480da83c2eSBarry Smith break; 18490da83c2eSBarry Smith default: 18509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18510da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18530da83c2eSBarry Smith } 18540da83c2eSBarry Smith ncnt += bsizes[i]; 18550da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18560da83c2eSBarry Smith } 185748a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18589566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18590da83c2eSBarry Smith PetscFunctionReturn(0); 18600da83c2eSBarry Smith } 18610da83c2eSBarry Smith 
1862422a814eSBarry Smith /* 1863422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1864422a814eSBarry Smith */ 1865d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1866d71ae5a4SJacob Faibussowitsch { 186771f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1868d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18692e5835c6SStefano Zampini const MatScalar *v; 187054f21887SBarry Smith PetscScalar *idiag, *mdiag; 187171f1c65dSBarry Smith 187271f1c65dSBarry Smith PetscFunctionBegin; 187371f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18749566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 187571f1c65dSBarry Smith diag = a->diag; 18764dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18772e5835c6SStefano Zampini 187871f1c65dSBarry Smith mdiag = a->mdiag; 187971f1c65dSBarry Smith idiag = a->idiag; 18809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1881422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 188271f1c65dSBarry Smith for (i = 0; i < m; i++) { 188371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1884899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1885899639b0SHong Zhang if (PetscRealPart(fshift)) { 18869566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18877b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18887b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18897b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1891899639b0SHong Zhang } 189271f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 189371f1c65dSBarry Smith } 18949566063dSJacob 
Faibussowitsch PetscCall(PetscLogFlops(m)); 189571f1c65dSBarry Smith } else { 189671f1c65dSBarry Smith for (i = 0; i < m; i++) { 189771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 189871f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 189971f1c65dSBarry Smith } 19009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190171f1c65dSBarry Smith } 190271f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 190471f1c65dSBarry Smith PetscFunctionReturn(0); 190571f1c65dSBarry Smith } 190671f1c65dSBarry Smith 1907c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1908d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1909d71ae5a4SJacob Faibussowitsch { 1910416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1911e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19122e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 191354f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19143d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 191597f1f81fSBarry Smith const PetscInt *idx, *diag; 191617ab2063SBarry Smith 19173a40ed3dSBarry Smith PetscFunctionBegin; 1918b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19199566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1920b215bc84SStefano Zampini PetscFunctionReturn(0); 1921b215bc84SStefano Zampini } 1922b965ef7fSBarry Smith its = its * lits; 192391723122SBarry Smith 192471f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19259566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 192671f1c65dSBarry Smith a->fshift = fshift; 192771f1c65dSBarry Smith 
a->omega = omega; 1928ed480e8bSBarry Smith 192971f1c65dSBarry Smith diag = a->diag; 193071f1c65dSBarry Smith t = a->ssor_work; 1931ed480e8bSBarry Smith idiag = a->idiag; 193271f1c65dSBarry Smith mdiag = a->mdiag; 1933ed480e8bSBarry Smith 19349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19359566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19369566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1937ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 193817ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 193917ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1940ed480e8bSBarry Smith bs = b; 194117ab2063SBarry Smith for (i = 0; i < m; i++) { 194271f1c65dSBarry Smith d = fshift + mdiag[i]; 1943416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1944ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19452e5835c6SStefano Zampini v = aa + diag[i] + 1; 194617ab2063SBarry Smith sum = b[i] * d / omega; 1947003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 194817ab2063SBarry Smith x[i] = sum; 194917ab2063SBarry Smith } 19509566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19519566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19539566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19543a40ed3dSBarry Smith PetscFunctionReturn(0); 195517ab2063SBarry Smith } 1956c783ea89SBarry Smith 195708401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1958f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19594c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1960887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196117ab2063SBarry Smith 196217ab2063SBarry Smith (L + E)^{-1} A (U + 
E)^{-1} 196317ab2063SBarry Smith 1964887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 196517ab2063SBarry Smith */ 196617ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 196717ab2063SBarry Smith 196817ab2063SBarry Smith /* x = (E + U)^{-1} b */ 196917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1970416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1971ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19722e5835c6SStefano Zampini v = aa + diag[i] + 1; 197317ab2063SBarry Smith sum = b[i]; 1974e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1975ed480e8bSBarry Smith x[i] = sum * idiag[i]; 197617ab2063SBarry Smith } 197717ab2063SBarry Smith 197817ab2063SBarry Smith /* t = b - (2*E - D)x */ 19792e5835c6SStefano Zampini v = aa; 19802205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198117ab2063SBarry Smith 198217ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1983ed480e8bSBarry Smith ts = t; 1984416022c9SBarry Smith diag = a->diag; 198517ab2063SBarry Smith for (i = 0; i < m; i++) { 1986416022c9SBarry Smith n = diag[i] - a->i[i]; 1987ed480e8bSBarry Smith idx = a->j + a->i[i]; 19882e5835c6SStefano Zampini v = aa + a->i[i]; 198917ab2063SBarry Smith sum = t[i]; 1990003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1991ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1992733d66baSBarry Smith /* x = x + t */ 1993733d66baSBarry Smith x[i] += t[i]; 199417ab2063SBarry Smith } 199517ab2063SBarry Smith 19969566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 19979566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19989566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19993a40ed3dSBarry Smith PetscFunctionReturn(0); 200017ab2063SBarry Smith } 200117ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 200217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 200317ab2063SBarry Smith for (i = 0; i < m; i++) 
{ 2004416022c9SBarry Smith n = diag[i] - a->i[i]; 2005ed480e8bSBarry Smith idx = a->j + a->i[i]; 20062e5835c6SStefano Zampini v = aa + a->i[i]; 200717ab2063SBarry Smith sum = b[i]; 2008e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20095c99c7daSBarry Smith t[i] = sum; 2010ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201117ab2063SBarry Smith } 20125c99c7daSBarry Smith xb = t; 20139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20143a40ed3dSBarry Smith } else xb = b; 201517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 201617ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2017416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2018ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20192e5835c6SStefano Zampini v = aa + diag[i] + 1; 202017ab2063SBarry Smith sum = xb[i]; 2021e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20225c99c7daSBarry Smith if (xb == b) { 2023ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20245c99c7daSBarry Smith } else { 2025b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 202617ab2063SBarry Smith } 20275c99c7daSBarry Smith } 20289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 202917ab2063SBarry Smith } 203017ab2063SBarry Smith its--; 203117ab2063SBarry Smith } 203217ab2063SBarry Smith while (its--) { 203317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203417ab2063SBarry Smith for (i = 0; i < m; i++) { 2035b19a5dc2SMark Adams /* lower */ 2036b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2037ed480e8bSBarry Smith idx = a->j + a->i[i]; 20382e5835c6SStefano Zampini v = aa + a->i[i]; 203917ab2063SBarry Smith sum = b[i]; 2040e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2041b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2042b19a5dc2SMark Adams /* upper */ 2043b19a5dc2SMark Adams n = a->i[i + 1] - 
diag[i] - 1; 2044b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20452e5835c6SStefano Zampini v = aa + diag[i] + 1; 2046b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2047b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204817ab2063SBarry Smith } 2049b19a5dc2SMark Adams xb = t; 20509566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2051b19a5dc2SMark Adams } else xb = b; 205217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205317ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2054b19a5dc2SMark Adams sum = xb[i]; 2055b19a5dc2SMark Adams if (xb == b) { 2056b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2057416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2058ed480e8bSBarry Smith idx = a->j + a->i[i]; 20592e5835c6SStefano Zampini v = aa + a->i[i]; 2060e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2061ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2062b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2063b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2064b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20652e5835c6SStefano Zampini v = aa + diag[i] + 1; 2066b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2067b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206817ab2063SBarry Smith } 2069b19a5dc2SMark Adams } 2070b19a5dc2SMark Adams if (xb == b) { 20719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2072b19a5dc2SMark Adams } else { 20739566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2074b19a5dc2SMark Adams } 207517ab2063SBarry Smith } 207617ab2063SBarry Smith } 20779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20789566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2080365a8a9eSBarry Smith PetscFunctionReturn(0); 208117ab2063SBarry Smith } 208217ab2063SBarry Smith 2083d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2084d71ae5a4SJacob Faibussowitsch { 2085416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20864e220ebcSLois Curfman McInnes 20873a40ed3dSBarry Smith PetscFunctionBegin; 20884e220ebcSLois Curfman McInnes info->block_size = 1.0; 20893966268fSBarry Smith info->nz_allocated = a->maxnz; 20903966268fSBarry Smith info->nz_used = a->nz; 20913966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20923966268fSBarry Smith info->assemblies = A->num_ass; 20933966268fSBarry Smith info->mallocs = A->info.mallocs; 20944dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2095d5f3da31SBarry Smith if (A->factortype) { 20964e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20974e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20984e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 20994e220ebcSLois Curfman McInnes } else { 21004e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21014e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21024e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21034e220ebcSLois Curfman 
McInnes } 21043a40ed3dSBarry Smith PetscFunctionReturn(0); 210517ab2063SBarry Smith } 210617ab2063SBarry Smith 2107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2108d71ae5a4SJacob Faibussowitsch { 2109416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2110c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211197b48c8fSBarry Smith const PetscScalar *xx; 21122e5835c6SStefano Zampini PetscScalar *bb, *aa; 2113c7da8527SEric Chamberland PetscInt d = 0; 211417ab2063SBarry Smith 21153a40ed3dSBarry Smith PetscFunctionBegin; 211697b48c8fSBarry Smith if (x && b) { 21179566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21189566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 211997b48c8fSBarry Smith for (i = 0; i < N; i++) { 2120aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2121447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 212297b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 212397b48c8fSBarry Smith } 21249566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21259566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 212697b48c8fSBarry Smith } 212797b48c8fSBarry Smith 21289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2129a9817697SBarry Smith if (a->keepnonzeropattern) { 2130f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2131aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21329566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2133f1e2ffcdSBarry Smith } 2134f4df32b1SMatthew Knepley if (diag != 0.0) { 2135c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2136c7da8527SEric Chamberland d = rows[i]; 2137447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 213808401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2139c7da8527SEric Chamberland } 2140f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2141447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21422e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2143f1e2ffcdSBarry Smith } 2144f1e2ffcdSBarry Smith } 2145f1e2ffcdSBarry Smith } else { 2146f4df32b1SMatthew Knepley if (diag != 0.0) { 214717ab2063SBarry Smith for (i = 0; i < N; i++) { 2148aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21497ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2150447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2151447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2152447d62f5SStefano Zampini } else { 2153416022c9SBarry Smith a->ilen[rows[i]] = 1; 21542e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2155bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2156447d62f5SStefano Zampini } 2157447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21589566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 215917ab2063SBarry Smith } 216017ab2063SBarry Smith } 21613a40ed3dSBarry Smith } else { 216217ab2063SBarry Smith for (i = 0; i < N; i++) { 2163aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2164416022c9SBarry Smith a->ilen[rows[i]] = 0; 216517ab2063SBarry Smith } 216617ab2063SBarry Smith } 2167e56f5c9eSBarry Smith A->nonzerostate++; 2168f1e2ffcdSBarry Smith } 21699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2170dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21713a40ed3dSBarry Smith PetscFunctionReturn(0); 217217ab2063SBarry Smith } 217317ab2063SBarry Smith 2174d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2175d71ae5a4SJacob Faibussowitsch { 21766e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21776e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21782b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21796e169961SBarry Smith const PetscScalar *xx; 21802e5835c6SStefano Zampini PetscScalar *bb, *aa; 21816e169961SBarry Smith 21826e169961SBarry Smith PetscFunctionBegin; 21832e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21856e169961SBarry Smith if (x && b) { 21869566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21879566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21882b40b63fSBarry Smith vecs = PETSC_TRUE; 21896e169961SBarry Smith } 21909566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21916e169961SBarry Smith for (i = 0; i < N; i++) { 2192aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21939566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 21942205254eSKarl Rupp 21956e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21966e169961SBarry Smith } 21976e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 21986e169961SBarry Smith if (!zeroed[i]) { 21996e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22004cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22012e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22022e5835c6SStefano Zampini aa[j] = 0.0; 22036e169961SBarry Smith } 22046e169961SBarry Smith } 22054cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22066e169961SBarry Smith } 22076e169961SBarry Smith if (x && b) { 22089566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22099566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22106e169961SBarry Smith } 22119566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22126e169961SBarry Smith if (diag != 0.0) { 22139566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22141d5a398dSstefano_zampini if (missing) { 22151d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22164cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2217aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22189566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22191d5a398dSstefano_zampini } 22201d5a398dSstefano_zampini } else { 2221ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22226e169961SBarry Smith } 22231d5a398dSstefano_zampini } 22249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2225dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22266e169961SBarry Smith PetscFunctionReturn(0); 22276e169961SBarry Smith } 22286e169961SBarry Smith 2229d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2230d71ae5a4SJacob Faibussowitsch { 2231fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2232fff043a9SJunchao Zhang const PetscScalar *aa; 2233fff043a9SJunchao Zhang PetscInt *itmp; 223417ab2063SBarry Smith 22353a40ed3dSBarry Smith PetscFunctionBegin; 22369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2237416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22382e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 223917ab2063SBarry Smith if (idx) { 2240bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224126fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2242f4259b30SLisandro Dalcin else *idx = NULL; 224317ab2063SBarry Smith } 22449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22453a40ed3dSBarry Smith PetscFunctionReturn(0); 224617ab2063SBarry Smith } 224717ab2063SBarry Smith 2248d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2249d71ae5a4SJacob Faibussowitsch { 22503a40ed3dSBarry Smith PetscFunctionBegin; 2251cb4a9cd9SHong Zhang if (nz) *nz = 0; 22522e5835c6SStefano Zampini if (idx) *idx = NULL; 22532e5835c6SStefano Zampini if (v) *v = NULL; 22543a40ed3dSBarry Smith PetscFunctionReturn(0); 225517ab2063SBarry Smith } 225617ab2063SBarry Smith 2257d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2258d71ae5a4SJacob Faibussowitsch { 2259416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22602e5835c6SStefano Zampini const MatScalar *v; 226136db0b34SBarry Smith PetscReal sum = 0.0; 226297f1f81fSBarry Smith PetscInt i, j; 226317ab2063SBarry Smith 22643a40ed3dSBarry Smith PetscFunctionBegin; 22659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 226617ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2267570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2268570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2269792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2270570b7f6dSBarry Smith #else 2271416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22729371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22739371c9d4SSatish Balay v++; 227417ab2063SBarry Smith } 22758f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2276570b7f6dSBarry Smith #endif 22779566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22783a40ed3dSBarry Smith } else if (type == NORM_1) { 227936db0b34SBarry Smith PetscReal *tmp; 228097f1f81fSBarry Smith PetscInt *jj = a->j; 22819566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2282064f8208SBarry Smith *nrm = 0.0; 2283416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22849371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22859371c9d4SSatish Balay v++; 228617ab2063SBarry Smith } 2287d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2288064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 228917ab2063SBarry Smith } 22909566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22919566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22923a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2293064f8208SBarry Smith *nrm = 0.0; 2294d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22952e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 229617ab2063SBarry Smith sum = 0.0; 2297416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 22989371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 22999371c9d4SSatish Balay v2++; 230017ab2063SBarry Smith } 2301064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230217ab2063SBarry Smith } 23039566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2304f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23063a40ed3dSBarry Smith PetscFunctionReturn(0); 230717ab2063SBarry Smith } 230817ab2063SBarry Smith 2309d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2310d71ae5a4SJacob Faibussowitsch { 23113d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231254f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23132e5835c6SStefano Zampini const MatScalar *va, *vb; 
231497f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2315cd0d46ebSvictorle 2316cd0d46ebSvictorle PetscFunctionBegin; 23179566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23189566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23195485867bSBarry Smith if (ma != nb || na != mb) { 23205485867bSBarry Smith *f = PETSC_FALSE; 23215485867bSBarry Smith PetscFunctionReturn(0); 23225485867bSBarry Smith } 23239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23259371c9d4SSatish Balay aii = aij->i; 23269371c9d4SSatish Balay bii = bij->i; 23279371c9d4SSatish Balay adx = aij->j; 23289371c9d4SSatish Balay bdx = bij->j; 23299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2331cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2332cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2333cd0d46ebSvictorle 2334cd0d46ebSvictorle *f = PETSC_TRUE; 2335cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2336cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 233797f1f81fSBarry Smith PetscInt idc, idr; 23385485867bSBarry Smith PetscScalar vc, vr; 2339cd0d46ebSvictorle /* column/row index/value */ 23405485867bSBarry Smith idc = adx[aptr[i]]; 23415485867bSBarry Smith idr = bdx[bptr[idc]]; 23425485867bSBarry Smith vc = va[aptr[i]]; 23435485867bSBarry Smith vr = vb[bptr[idc]]; 23445485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23455485867bSBarry Smith *f = PETSC_FALSE; 23465485867bSBarry Smith goto done; 2347cd0d46ebSvictorle } else { 23485485867bSBarry Smith aptr[i]++; 23495485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2350cd0d46ebSvictorle } 2351cd0d46ebSvictorle } 2352cd0d46ebSvictorle } 2353cd0d46ebSvictorle done: 23549566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23559566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2358cd0d46ebSvictorle PetscFunctionReturn(0); 2359cd0d46ebSvictorle } 2360cd0d46ebSvictorle 2361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2362d71ae5a4SJacob Faibussowitsch { 23633d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236454f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236554f21887SBarry Smith MatScalar *va, *vb; 23661cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23671cbb95d3SBarry Smith 23681cbb95d3SBarry Smith PetscFunctionBegin; 23699566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23709566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23711cbb95d3SBarry Smith if (ma != nb || na != mb) { 23721cbb95d3SBarry Smith *f = PETSC_FALSE; 23731cbb95d3SBarry Smith PetscFunctionReturn(0); 23741cbb95d3SBarry Smith } 23759371c9d4SSatish Balay aii = aij->i; 23769371c9d4SSatish Balay bii = bij->i; 23779371c9d4SSatish Balay adx = aij->j; 23789371c9d4SSatish Balay bdx = bij->j; 23799371c9d4SSatish Balay va = aij->a; 23809371c9d4SSatish Balay vb = bij->a; 23819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23831cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23841cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23851cbb95d3SBarry Smith 23861cbb95d3SBarry Smith *f = PETSC_TRUE; 23871cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23881cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23891cbb95d3SBarry Smith PetscInt idc, idr; 23901cbb95d3SBarry Smith PetscScalar vc, vr; 23911cbb95d3SBarry Smith /* column/row index/value */ 23921cbb95d3SBarry Smith idc = adx[aptr[i]]; 23931cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
23941cbb95d3SBarry Smith vc = va[aptr[i]]; 23951cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23961cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 23971cbb95d3SBarry Smith *f = PETSC_FALSE; 23981cbb95d3SBarry Smith goto done; 23991cbb95d3SBarry Smith } else { 24001cbb95d3SBarry Smith aptr[i]++; 24011cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24021cbb95d3SBarry Smith } 24031cbb95d3SBarry Smith } 24041cbb95d3SBarry Smith } 24051cbb95d3SBarry Smith done: 24069566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24079566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24081cbb95d3SBarry Smith PetscFunctionReturn(0); 24091cbb95d3SBarry Smith } 24101cbb95d3SBarry Smith 2411d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2412d71ae5a4SJacob Faibussowitsch { 24139e29f15eSvictorle PetscFunctionBegin; 24149566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24159e29f15eSvictorle PetscFunctionReturn(0); 24169e29f15eSvictorle } 24179e29f15eSvictorle 2418d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2419d71ae5a4SJacob Faibussowitsch { 24201cbb95d3SBarry Smith PetscFunctionBegin; 24219566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24221cbb95d3SBarry Smith PetscFunctionReturn(0); 24231cbb95d3SBarry Smith } 24241cbb95d3SBarry Smith 2425d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2426d71ae5a4SJacob Faibussowitsch { 2427416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2428fff8e43fSBarry Smith const PetscScalar *l, *r; 2429fff8e43fSBarry Smith PetscScalar x; 243054f21887SBarry Smith MatScalar *v; 2431fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2432fff8e43fSBarry Smith const PetscInt *jj; 243317ab2063SBarry Smith 24343a40ed3dSBarry Smith PetscFunctionBegin; 
243517ab2063SBarry Smith if (ll) { 24363ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24373ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24389566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 243908401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24409566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244217ab2063SBarry Smith for (i = 0; i < m; i++) { 244317ab2063SBarry Smith x = l[i]; 2444416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24452205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244617ab2063SBarry Smith } 24479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24489566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245017ab2063SBarry Smith } 245117ab2063SBarry Smith if (rr) { 24529566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245308401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24549566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24562e5835c6SStefano Zampini jj = a->j; 24572205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24599566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24609566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246117ab2063SBarry Smith } 24629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24633a40ed3dSBarry Smith PetscFunctionReturn(0); 246417ab2063SBarry Smith } 246517ab2063SBarry Smith 2466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2467d71ae5a4SJacob Faibussowitsch { 2468db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2469d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247097f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24715d0c19d7SBarry Smith const PetscInt *irow, *icol; 24722e5835c6SStefano Zampini const PetscScalar *aa; 24735d0c19d7SBarry Smith PetscInt nrows, ncols; 247497f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 247554f21887SBarry Smith MatScalar *a_new, *mat_a; 2476416022c9SBarry Smith Mat C; 2477cdc6f3adSToby Isaac PetscBool stride; 247817ab2063SBarry Smith 24793a40ed3dSBarry Smith PetscFunctionBegin; 24809566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24819566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24829566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248317ab2063SBarry Smith 24849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2485ff718158SBarry Smith if (stride) { 24869566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2487ff718158SBarry Smith } else { 2488ff718158SBarry Smith first = 0; 2489ff718158SBarry Smith step = 0; 2490ff718158SBarry Smith } 2491fee21e36SBarry Smith if (stride && step == 1) { 249202834360SBarry Smith /* special case of contiguous rows */ 24939566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249402834360SBarry Smith /* loop over new rows determining lens and starting points */ 249502834360SBarry Smith for (i = 0; i < nrows; i++) { 2496bfeeae90SHong Zhang kstart = ai[irow[i]]; 2497a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2498a91a9bebSLisandro Dalcin starts[i] = kstart; 249902834360SBarry Smith for (k = kstart; k < kend; k++) { 2500bfeeae90SHong Zhang if (aj[k] >= 
first) { 250102834360SBarry Smith starts[i] = k; 250202834360SBarry Smith break; 250302834360SBarry Smith } 250402834360SBarry Smith } 2505a2744918SBarry Smith sum = 0; 250602834360SBarry Smith while (k < kend) { 2507bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2508a2744918SBarry Smith sum++; 250902834360SBarry Smith } 2510a2744918SBarry Smith lens[i] = sum; 251102834360SBarry Smith } 251202834360SBarry Smith /* create submatrix */ 2513cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251497f1f81fSBarry Smith PetscInt n_cols, n_rows; 25159566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2516aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25179566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251808480c60SBarry Smith C = *B; 25193a40ed3dSBarry Smith } else { 25203bef6203SJed Brown PetscInt rbs, cbs; 25219566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25229566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25239566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25249566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25259566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252808480c60SBarry Smith } 2529db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2530db02288aSLois Curfman McInnes 253102834360SBarry Smith /* loop over rows inserting into submatrix */ 2532db02288aSLois Curfman McInnes a_new = c->a; 2533db02288aSLois Curfman McInnes j_new = c->j; 2534db02288aSLois Curfman McInnes i_new = c->i; 25359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253602834360SBarry Smith for (i 
= 0; i < nrows; i++) { 2537a2744918SBarry Smith ii = starts[i]; 2538a2744918SBarry Smith lensi = lens[i]; 2539ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2541a2744918SBarry Smith a_new += lensi; 2542a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2543a2744918SBarry Smith c->ilen[i] = lensi; 254402834360SBarry Smith } 25459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25469566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25473a40ed3dSBarry Smith } else { 25489566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25499566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25514dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25526bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25534dcab191SBarry Smith smap[icol[i]] = i + 1; 25544dcab191SBarry Smith } 25554dcab191SBarry Smith 255602834360SBarry Smith /* determine lens of each row */ 255702834360SBarry Smith for (i = 0; i < nrows; i++) { 2558bfeeae90SHong Zhang kstart = ai[irow[i]]; 255902834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256002834360SBarry Smith lens[i] = 0; 256102834360SBarry Smith for (k = kstart; k < kend; k++) { 2562ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256302834360SBarry Smith } 256402834360SBarry Smith } 256517ab2063SBarry Smith /* Create and fill new matrix */ 2566a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2567ace3abfcSBarry Smith PetscBool equal; 25680f5bd95cSBarry Smith 256999141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2570aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == 
ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25719566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 257228b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25739566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257408480c60SBarry Smith C = *B; 25753a40ed3dSBarry Smith } else { 25763bef6203SJed Brown PetscInt rbs, cbs; 25779566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25789566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25799566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25809566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25819566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25829566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258408480c60SBarry Smith } 25859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 258699141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 258717ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258899141d43SSatish Balay row = irow[i]; 2589bfeeae90SHong Zhang kstart = ai[row]; 259099141d43SSatish Balay kend = kstart + a->ilen[row]; 2591bfeeae90SHong Zhang mat_i = c->i[i]; 259299141d43SSatish Balay mat_j = c->j + mat_i; 259399141d43SSatish Balay mat_a = c->a + mat_i; 259499141d43SSatish Balay mat_ilen = c->ilen + i; 259517ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2596bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2597ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25982e5835c6SStefano Zampini *mat_a++ = aa[k]; 259999141d43SSatish Balay (*mat_ilen)++; 260017ab2063SBarry Smith } 260117ab2063SBarry Smith } 260217ab2063SBarry Smith } 26039566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260402834360SBarry Smith /* Free work space */ 26059566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26069566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26079566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2608cdc6f3adSToby Isaac /* sort */ 2609cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2610cdc6f3adSToby Isaac PetscInt ilen; 2611cdc6f3adSToby Isaac 2612cdc6f3adSToby Isaac mat_i = c->i[i]; 2613cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2614cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2615cdc6f3adSToby Isaac ilen = c->ilen[i]; 26169566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2617cdc6f3adSToby Isaac } 261802834360SBarry Smith } 26198c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26209566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2621305c6ccfSStefano Zampini #endif 26229566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262417ab2063SBarry Smith 26259566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2626416022c9SBarry Smith *B = C; 26273a40ed3dSBarry Smith PetscFunctionReturn(0); 262817ab2063SBarry Smith } 262917ab2063SBarry Smith 2630d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2631d71ae5a4SJacob Faibussowitsch { 263282d44351SHong Zhang Mat B; 263382d44351SHong Zhang 263482d44351SHong Zhang PetscFunctionBegin; 2635c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26369566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26389566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26399566063dSJacob Faibussowitsch 
PetscCall(MatSetType(B, MATSEQAIJ)); 26409566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264182d44351SHong Zhang *subMat = B; 2642c2d650bdSHong Zhang } else { 26439566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2644c2d650bdSHong Zhang } 264582d44351SHong Zhang PetscFunctionReturn(0); 264682d44351SHong Zhang } 264782d44351SHong Zhang 2648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2649d71ae5a4SJacob Faibussowitsch { 265063b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265163b91edcSBarry Smith Mat outA; 2652ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265363b91edcSBarry Smith 26543a40ed3dSBarry Smith PetscFunctionBegin; 265508401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26561df811f5SHong Zhang 26579566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26589566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2659a871dcd8SBarry Smith 266063b91edcSBarry Smith outA = inA; 2661d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26629566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26639566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26642205254eSKarl Rupp 26659566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26669566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26672205254eSKarl Rupp 2668c3122656SLisandro Dalcin a->row = row; 26692205254eSKarl Rupp 26709566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26719566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26722205254eSKarl Rupp 2673c3122656SLisandro Dalcin a->col = col; 267463b91edcSBarry Smith 267536db0b34SBarry Smith /* Create the inverse permutation so 
that it can be used in MatLUFactorNumeric() */ 26769566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26779566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2678f0ec6fceSSatish Balay 267994a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268194a9d846SBarry Smith } 268263b91edcSBarry Smith 26839566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2684137fb511SHong Zhang if (row_identity && col_identity) { 26859566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2686137fb511SHong Zhang } else { 26879566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2688137fb511SHong Zhang } 26893a40ed3dSBarry Smith PetscFunctionReturn(0); 2690a871dcd8SBarry Smith } 2691a871dcd8SBarry Smith 2692d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2693d71ae5a4SJacob Faibussowitsch { 2694f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2695dfa0f9e5SStefano Zampini PetscScalar *v; 2696c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26973a40ed3dSBarry Smith 26983a40ed3dSBarry Smith PetscFunctionBegin; 26999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27009566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2701792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27029566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27053a40ed3dSBarry Smith PetscFunctionReturn(0); 2706f0b747eeSBarry Smith } 2707f0b747eeSBarry Smith 2708d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 
2709d71ae5a4SJacob Faibussowitsch { 271016b64355SHong Zhang PetscInt i; 271116b64355SHong Zhang 271216b64355SHong Zhang PetscFunctionBegin; 271316b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27149566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271516b64355SHong Zhang 271648a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27179566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 271816b64355SHong Zhang 271916b64355SHong Zhang if (submatj->rbuf1) { 27209566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27219566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272216b64355SHong Zhang } 272316b64355SHong Zhang 272448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27269566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272716b64355SHong Zhang } 272816b64355SHong Zhang 272916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2730*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27319566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27329566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273316b64355SHong Zhang #else 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273516b64355SHong Zhang #endif 273616b64355SHong Zhang 273716b64355SHong Zhang if (!submatj->allcolumns) { 273816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2739*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 274016b64355SHong Zhang #else 27419566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274216b64355SHong Zhang #endif 
274316b64355SHong Zhang } 27449566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274516b64355SHong Zhang 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 274716b64355SHong Zhang PetscFunctionReturn(0); 274816b64355SHong Zhang } 274916b64355SHong Zhang 2750d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2751d71ae5a4SJacob Faibussowitsch { 275216b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27535c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275416b64355SHong Zhang 275516b64355SHong Zhang PetscFunctionBegin; 27569566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27579566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 275816b64355SHong Zhang PetscFunctionReturn(0); 275916b64355SHong Zhang } 276016b64355SHong Zhang 276189a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2762d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2763d71ae5a4SJacob Faibussowitsch { 27642d033e1fSHong Zhang PetscInt i; 27650fb991dcSHong Zhang Mat C; 27660fb991dcSHong Zhang Mat_SeqAIJ *c; 27670fb991dcSHong Zhang Mat_SubSppt *submatj; 27682d033e1fSHong Zhang 27692d033e1fSHong Zhang PetscFunctionBegin; 27702d033e1fSHong Zhang for (i = 0; i < n; i++) { 27710fb991dcSHong Zhang C = (*mat)[i]; 27720fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27730fb991dcSHong Zhang submatj = c->submatis1; 27742d033e1fSHong Zhang if (submatj) { 2775682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277626cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27779566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27789566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27799566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27803faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27819566063dSJacob Faibussowitsch 
PetscCall(PetscLayoutDestroy(&C->rmap)); 27829566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27839566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2784682e4c99SStefano Zampini } 27852d033e1fSHong Zhang } else { 27869566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27872d033e1fSHong Zhang } 27882d033e1fSHong Zhang } 278986e85357SHong Zhang 279063a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27919566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279263a75b2aSHong Zhang 27939566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27942d033e1fSHong Zhang PetscFunctionReturn(0); 27952d033e1fSHong Zhang } 27962d033e1fSHong Zhang 2797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2798d71ae5a4SJacob Faibussowitsch { 279997f1f81fSBarry Smith PetscInt i; 2800cddf8d76SBarry Smith 28013a40ed3dSBarry Smith PetscFunctionBegin; 280248a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2803cddf8d76SBarry Smith 280448a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28053a40ed3dSBarry Smith PetscFunctionReturn(0); 2806cddf8d76SBarry Smith } 2807cddf8d76SBarry Smith 2808d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2809d71ae5a4SJacob Faibussowitsch { 2810e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28115d0c19d7SBarry Smith PetscInt row, i, j, k, l, m, n, *nidx, isz, val; 28125d0c19d7SBarry Smith const PetscInt *idx; 281397f1f81fSBarry Smith PetscInt start, end, *ai, *aj; 2814f1af5d2fSBarry Smith PetscBT table; 2815bbd702dbSSatish Balay 28163a40ed3dSBarry Smith PetscFunctionBegin; 2817d0f46423SBarry Smith m = A->rmap->n; 2818e4d965acSSatish Balay ai = a->i; 2819bfeeae90SHong Zhang 
aj = a->j; 28208a047759SSatish Balay 282108401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282206763907SSatish Balay 28239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28249566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282506763907SSatish Balay 2826e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2827b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2828e4d965acSSatish Balay isz = 0; 28299566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2830e4d965acSSatish Balay 2831e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28329566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28339566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2834e4d965acSSatish Balay 2835dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2836e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28372205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28384dcbc457SBarry Smith } 28399566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28409566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2841e4d965acSSatish Balay 284204a348a9SBarry Smith k = 0; 284304a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 284404a348a9SBarry Smith n = isz; 284506763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2846e4d965acSSatish Balay row = nidx[k]; 2847e4d965acSSatish Balay start = ai[row]; 2848e4d965acSSatish Balay end = ai[row + 1]; 284904a348a9SBarry Smith for (l = start; l < end; l++) { 2850efb16452SHong Zhang val = aj[l]; 28512205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2852e4d965acSSatish Balay } 2853e4d965acSSatish Balay } 2854e4d965acSSatish Balay } 28559566063dSJacob 
Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2856e4d965acSSatish Balay } 28579566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28589566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28593a40ed3dSBarry Smith PetscFunctionReturn(0); 28604dcbc457SBarry Smith } 286117ab2063SBarry Smith 28620513a670SBarry Smith /* -------------------------------------------------------------- */ 2863d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2864d71ae5a4SJacob Faibussowitsch { 28650513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28663b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28675d0c19d7SBarry Smith const PetscInt *row, *col; 28685d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 286956cd22aeSBarry Smith IS icolp, irowp; 28700298fd71SBarry Smith PetscInt *cwork = NULL; 28710298fd71SBarry Smith PetscScalar *vwork = NULL; 28720513a670SBarry Smith 28733a40ed3dSBarry Smith PetscFunctionBegin; 28749566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 28759566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 28769566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 28779566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 28780513a670SBarry Smith 28790513a670SBarry Smith /* determine lengths of permuted rows */ 28809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 28812205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 28829566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 28839566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 28849566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 28859566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 28869566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 28879566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 28880513a670SBarry Smith 28899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 28900513a670SBarry Smith for (i = 0; i < m; i++) { 28919566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28922205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 28939566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 28949566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28950513a670SBarry Smith } 28969566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 28972205254eSKarl Rupp 28983c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 28992205254eSKarl Rupp 29008c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29019566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29029fe5e383SStefano Zampini #endif 29039566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29049566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29059566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29069566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29079566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29089566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 290948a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29103a40ed3dSBarry Smith PetscFunctionReturn(0); 29110513a670SBarry Smith } 29120513a670SBarry Smith 2913d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2914d71ae5a4SJacob Faibussowitsch { 2915cb5b572fSBarry Smith PetscFunctionBegin; 291633f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 291733f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2918be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2919be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29202e5835c6SStefano Zampini const PetscScalar *aa; 2921be6bf707SBarry Smith 29229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 292308401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29249566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29259566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2927cb5b572fSBarry Smith } else { 29289566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2929cb5b572fSBarry Smith } 2930cb5b572fSBarry Smith PetscFunctionReturn(0); 2931cb5b572fSBarry Smith } 2932cb5b572fSBarry Smith 2933d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2934d71ae5a4SJacob Faibussowitsch { 2935273d9f13SBarry Smith PetscFunctionBegin; 29369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2937273d9f13SBarry Smith PetscFunctionReturn(0); 2938273d9f13SBarry Smith } 2939273d9f13SBarry Smith 2940d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2941d71ae5a4SJacob Faibussowitsch { 29426c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29436e111a19SKarl Rupp 29446c0721eeSBarry Smith PetscFunctionBegin; 29456c0721eeSBarry Smith *array = a->a; 29466c0721eeSBarry Smith PetscFunctionReturn(0); 29476c0721eeSBarry Smith } 29486c0721eeSBarry Smith 2949d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2950d71ae5a4SJacob Faibussowitsch { 29516c0721eeSBarry Smith PetscFunctionBegin; 2952f38c1e66SStefano Zampini *array = NULL; 29536c0721eeSBarry Smith PetscFunctionReturn(0); 29546c0721eeSBarry Smith } 2955273d9f13SBarry Smith 29568229c054SShri Abhyankar /* 29578229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29588229c054SShri Abhyankar have different nonzero structure. 29598229c054SShri Abhyankar */ 2960d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2961d71ae5a4SJacob Faibussowitsch { 2962b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2963ec7775f6SShri Abhyankar 2964ec7775f6SShri Abhyankar PetscFunctionBegin; 2965ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2966ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 2967b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 2968b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2969b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29708af7cee1SJed Brown nnz[i] = 0; 29718af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2972b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2973b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29748af7cee1SJed Brown nnz[i]++; 29758af7cee1SJed Brown } 29768af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2977ec7775f6SShri Abhyankar } 2978ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2979ec7775f6SShri Abhyankar } 2980ec7775f6SShri Abhyankar 2981d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 2982d71ae5a4SJacob Faibussowitsch { 2983b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2984b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 2985b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 2986b264fe52SHong Zhang 2987b264fe52SHong Zhang PetscFunctionBegin; 2988b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 29899566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 2990b264fe52SHong Zhang PetscFunctionReturn(0); 2991b264fe52SHong Zhang } 2992b264fe52SHong Zhang 2993d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 2994d71ae5a4SJacob Faibussowitsch { 2995ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 2996ac90fabeSBarry Smith 2997ac90fabeSBarry Smith PetscFunctionBegin; 2998134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 2999134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3000134adf20SPierre Jolivet if (e) { 30019566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 300281fa06acSBarry Smith if (e) { 30039566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3004134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 300581fa06acSBarry Smith } 300681fa06acSBarry Smith } 300754c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 300881fa06acSBarry Smith } 3009ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30102e5835c6SStefano Zampini const PetscScalar *xa; 30112e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 301281fa06acSBarry Smith PetscBLASInt one = 1, bnz; 301381fa06acSBarry Smith 30149566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3017792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30209566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30229566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3023ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30249566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3025ac90fabeSBarry Smith } else { 30268229c054SShri Abhyankar Mat B; 30278229c054SShri Abhyankar PetscInt *nnz; 30289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30299566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30309566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30319566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30329566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30339566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30359566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30369566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30379bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30389566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3039ac90fabeSBarry Smith } 3040ac90fabeSBarry Smith PetscFunctionReturn(0); 3041ac90fabeSBarry Smith } 3042ac90fabeSBarry Smith 3043d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3044d71ae5a4SJacob Faibussowitsch { 3045354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3046354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3047354c94deSBarry Smith 
PetscInt i, nz; 3048354c94deSBarry Smith PetscScalar *a; 3049354c94deSBarry Smith 3050354c94deSBarry Smith PetscFunctionBegin; 3051354c94deSBarry Smith nz = aij->nz; 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30532205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3055354c94deSBarry Smith #else 3056354c94deSBarry Smith PetscFunctionBegin; 3057354c94deSBarry Smith #endif 3058354c94deSBarry Smith PetscFunctionReturn(0); 3059354c94deSBarry Smith } 3060354c94deSBarry Smith 3061d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3062d71ae5a4SJacob Faibussowitsch { 3063e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3064d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3065e34fafa9SBarry Smith PetscReal atmp; 3066985db425SBarry Smith PetscScalar *x; 3067ce496241SStefano Zampini const MatScalar *aa, *av; 3068e34fafa9SBarry Smith 3069e34fafa9SBarry Smith PetscFunctionBegin; 307028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3072ce496241SStefano Zampini aa = av; 3073e34fafa9SBarry Smith ai = a->i; 3074e34fafa9SBarry Smith aj = a->j; 3075e34fafa9SBarry Smith 30769566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 30779566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30789566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 307908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3080e34fafa9SBarry Smith for (i = 0; i < m; i++) { 30819371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30829371c9d4SSatish Balay ai++; 3083e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3084985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
30859371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 30869371c9d4SSatish Balay x[i] = atmp; 30879371c9d4SSatish Balay if (idx) idx[i] = *aj; 30889371c9d4SSatish Balay } 30899371c9d4SSatish Balay aa++; 30909371c9d4SSatish Balay aj++; 3091985db425SBarry Smith } 3092985db425SBarry Smith } 30939566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 30949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3095985db425SBarry Smith PetscFunctionReturn(0); 3096985db425SBarry Smith } 3097985db425SBarry Smith 3098d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3099d71ae5a4SJacob Faibussowitsch { 3100985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3101d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3102985db425SBarry Smith PetscScalar *x; 3103ce496241SStefano Zampini const MatScalar *aa, *av; 3104985db425SBarry Smith 3105985db425SBarry Smith PetscFunctionBegin; 310628b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3108ce496241SStefano Zampini aa = av; 3109985db425SBarry Smith ai = a->i; 3110985db425SBarry Smith aj = a->j; 3111985db425SBarry Smith 31129566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31139566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31149566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3116985db425SBarry Smith for (i = 0; i < m; i++) { 31179371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31189371c9d4SSatish Balay ai++; 3119d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31209371c9d4SSatish Balay x[i] = *aa; 31219371c9d4SSatish Balay if (idx) idx[i] = 0; 3122985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3123985db425SBarry Smith x[i] = 0.0; 3124985db425SBarry Smith if (idx) { 3125985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3126985db425SBarry Smith if (aj[j] > j) { 3127985db425SBarry Smith idx[i] = j; 3128985db425SBarry Smith break; 3129985db425SBarry Smith } 3130985db425SBarry Smith } 31311a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31321a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3133985db425SBarry Smith } 3134985db425SBarry Smith } 3135985db425SBarry Smith for (j = 0; j < ncols; j++) { 31369371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31379371c9d4SSatish Balay x[i] = *aa; 31389371c9d4SSatish Balay if (idx) idx[i] = *aj; 31399371c9d4SSatish Balay } 31409371c9d4SSatish Balay aa++; 31419371c9d4SSatish Balay aj++; 3142985db425SBarry Smith } 3143985db425SBarry Smith } 31449566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3146985db425SBarry Smith PetscFunctionReturn(0); 3147985db425SBarry Smith } 3148985db425SBarry Smith 3149d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3150d71ae5a4SJacob Faibussowitsch { 3151c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3152c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3153ce496241SStefano Zampini PetscScalar *x; 3154ce496241SStefano Zampini const MatScalar *aa, *av; 3155c87e5d42SMatthew Knepley 3156c87e5d42SMatthew Knepley PetscFunctionBegin; 31579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3158ce496241SStefano Zampini aa = av; 3159c87e5d42SMatthew Knepley ai = a->i; 3160c87e5d42SMatthew Knepley aj = a->j; 3161c87e5d42SMatthew Knepley 31629566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31639566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31649566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316508401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3166c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31679371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31689371c9d4SSatish Balay ai++; 3169f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 31709371c9d4SSatish Balay x[i] = *aa; 31719371c9d4SSatish Balay if (idx) idx[i] = 0; 3172f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3173f07e67edSHong Zhang x[i] = 0.0; 3174f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3175289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3176f07e67edSHong Zhang if (aj[j] > j) { 3177f07e67edSHong Zhang idx[i] = j; 31782205254eSKarl Rupp break; 31792205254eSKarl Rupp } 3180289a08f5SMatthew Knepley } 3181f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3182f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3183f07e67edSHong Zhang } 3184289a08f5SMatthew Knepley } 3185c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 31869371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 31879371c9d4SSatish Balay x[i] = *aa; 31889371c9d4SSatish Balay if (idx) idx[i] = *aj; 31899371c9d4SSatish Balay } 31909371c9d4SSatish Balay aa++; 31919371c9d4SSatish Balay aj++; 3192c87e5d42SMatthew Knepley } 3193c87e5d42SMatthew Knepley } 31949566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3196c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3197c87e5d42SMatthew Knepley } 3198c87e5d42SMatthew Knepley 3199d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3200d71ae5a4SJacob 
Faibussowitsch { 3201985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3202d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3203d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3204985db425SBarry Smith PetscScalar *x; 3205ce496241SStefano Zampini const MatScalar *aa, *av; 3206985db425SBarry Smith 3207985db425SBarry Smith PetscFunctionBegin; 320828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3210ce496241SStefano Zampini aa = av; 3211985db425SBarry Smith ai = a->i; 3212985db425SBarry Smith aj = a->j; 3213985db425SBarry Smith 32149566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32159566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32169566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321708401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3218985db425SBarry Smith for (i = 0; i < m; i++) { 32199371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32209371c9d4SSatish Balay ai++; 3221d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32229371c9d4SSatish Balay x[i] = *aa; 32239371c9d4SSatish Balay if (idx) idx[i] = 0; 3224985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3225985db425SBarry Smith x[i] = 0.0; 3226985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3227985db425SBarry Smith for (j = 0; j < ncols; j++) { 3228985db425SBarry Smith if (aj[j] > j) { 3229985db425SBarry Smith idx[i] = j; 3230985db425SBarry Smith break; 3231985db425SBarry Smith } 3232985db425SBarry Smith } 3233fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3234fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3235985db425SBarry Smith } 3236985db425SBarry Smith } 3237985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32389371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32399371c9d4SSatish Balay x[i] = *aa; 32409371c9d4SSatish Balay if (idx) idx[i] = *aj; 32419371c9d4SSatish Balay } 32429371c9d4SSatish Balay aa++; 32439371c9d4SSatish Balay aj++; 3244e34fafa9SBarry Smith } 3245e34fafa9SBarry Smith } 32469566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3248e34fafa9SBarry Smith PetscFunctionReturn(0); 3249e34fafa9SBarry Smith } 3250bbead8a2SBarry Smith 3251d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3252d71ae5a4SJacob Faibussowitsch { 3253bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 325433d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3255bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32560da83c2eSBarry Smith const PetscReal shift = 0.0; 32571a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3258bbead8a2SBarry Smith 3259bbead8a2SBarry Smith PetscFunctionBegin; 3260a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32614a0d0026SBarry Smith if (a->ibdiagvalid) { 32624a0d0026SBarry Smith if (values) *values = a->ibdiag; 32634a0d0026SBarry Smith PetscFunctionReturn(0); 32644a0d0026SBarry Smith } 32659566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 32664dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3267bbead8a2SBarry Smith diag = a->ibdiag; 3268bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3269bbead8a2SBarry Smith /* factor and invert each block */ 3270bbead8a2SBarry Smith switch (bs) { 3271bbead8a2SBarry Smith case 1: 3272bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32739566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3274ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3275ec1892c8SHong Zhang if (allowzeropivot) { 32767b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32777b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32787b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32799566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 328098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3281ec1892c8SHong Zhang } 3282bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3283bbead8a2SBarry Smith } 3284bbead8a2SBarry Smith break; 3285bbead8a2SBarry Smith case 2: 3286bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32879371c9d4SSatish Balay ij[0] = 2 * i; 32889371c9d4SSatish Balay ij[1] = 2 * i + 1; 32899566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 32909566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 32917b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32929566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3293bbead8a2SBarry Smith diag += 4; 3294bbead8a2SBarry Smith } 3295bbead8a2SBarry Smith break; 3296bbead8a2SBarry Smith case 3: 3297bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32989371c9d4SSatish Balay ij[0] = 3 * i; 32999371c9d4SSatish Balay ij[1] = 3 * i + 1; 33009371c9d4SSatish Balay ij[2] = 3 * i + 2; 33019566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33029566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33037b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33049566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3305bbead8a2SBarry Smith diag += 9; 3306bbead8a2SBarry Smith } 3307bbead8a2SBarry Smith break; 3308bbead8a2SBarry Smith case 4: 3309bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33109371c9d4SSatish Balay ij[0] = 4 * i; 33119371c9d4SSatish Balay ij[1] = 4 * i + 1; 33129371c9d4SSatish Balay ij[2] = 4 * i + 2; 33139371c9d4SSatish Balay ij[3] = 4 * i + 3; 33149566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33159566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33167b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33179566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3318bbead8a2SBarry Smith diag += 16; 3319bbead8a2SBarry Smith } 3320bbead8a2SBarry Smith break; 3321bbead8a2SBarry Smith case 5: 3322bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33239371c9d4SSatish Balay ij[0] = 5 * i; 33249371c9d4SSatish Balay ij[1] = 5 * i + 1; 33259371c9d4SSatish Balay ij[2] = 5 * i + 2; 33269371c9d4SSatish Balay ij[3] = 5 * i + 3; 33279371c9d4SSatish Balay ij[4] = 5 * i + 4; 33289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33307b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3332bbead8a2SBarry Smith diag += 25; 3333bbead8a2SBarry Smith } 3334bbead8a2SBarry Smith break; 3335bbead8a2SBarry Smith case 6: 3336bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33379371c9d4SSatish Balay ij[0] = 6 * i; 33389371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33399371c9d4SSatish Balay ij[2] = 6 * i + 2; 33409371c9d4SSatish Balay ij[3] = 6 * i + 3; 33419371c9d4SSatish Balay ij[4] = 6 * i + 4; 33429371c9d4SSatish Balay ij[5] = 6 * i + 5; 33439566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33457b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3347bbead8a2SBarry Smith diag += 36; 3348bbead8a2SBarry Smith } 3349bbead8a2SBarry Smith break; 3350bbead8a2SBarry Smith case 7: 3351bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33529371c9d4SSatish Balay ij[0] = 7 * i; 33539371c9d4SSatish Balay ij[1] = 7 * i + 1; 33549371c9d4SSatish Balay ij[2] = 7 * i + 2; 33559371c9d4SSatish Balay ij[3] = 7 * i + 3; 33569371c9d4SSatish Balay ij[4] = 7 * i + 4; 33579371c9d4SSatish Balay ij[5] = 7 * i + 5; 33589371c9d4SSatish Balay ij[5] = 7 * i + 6; 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3363bbead8a2SBarry Smith diag += 49; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith default: 33679566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3368bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3369ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 33709566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 33719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, 
v_work, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
      diag += bs2;
    }
    PetscCall(PetscFree3(v_work, v_pivots, IJ));
  }
  a->ibdiagvalid = PETSC_TRUE;
  PetscFunctionReturn(0);
}

/*
   MatSetRandom_SeqAIJ - Fills a SeqAIJ matrix with values drawn from rctx.

   If x is not yet assembled, imax[i] draws are made for every row i; each draw is
   added (ADD_VALUES) at a column derived from the real part of the drawn value itself.
   If x is already assembled, the first aij->nz stored values are overwritten in place.
   In both cases the matrix is (re)assembled with MAT_FINAL_ASSEMBLY before returning.

   NOTE(review): the column computation presumes the real part of each draw lies in
   [0,1) so that col stays within [0,n) - confirm against the interval set on rctx.
*/
static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
  PetscScalar a, *aa;
  PetscInt    m, n, i, j, col;

  PetscFunctionBegin;
  if (!x->assembled) {
    PetscCall(MatGetSize(x, &m, &n));
    for (i = 0; i < m; i++) {
      for (j = 0; j < aij->imax[i]; j++) {
        PetscCall(PetscRandomGetValue(rctx, &a));
        /* the same draw supplies both the column (scaled by n) and the value */
        col = (PetscInt)(n * PetscRealPart(a));
        PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
      }
    }
  } else {
    PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
    for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
    PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
  }
  PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
  PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
  PetscFunctionReturn(0);
}

/*
   Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high).

   Unlike MatSetRandom_SeqAIJ there is no branch on x->assembled: values are always
   inserted through MatSetValues() with ADD_VALUES, imax[i] draws per row.
*/
PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
  PetscScalar a;
  PetscInt    m, n, i, j, col, nskip;

  PetscFunctionBegin;
  nskip = high - low;
  PetscCall(MatGetSize(x, &m, &n));
  n -= nskip; /* shrink number of columns where nonzeros can be set */
  for (i = 0; i < m; i++) {
    for (j = 0; j < aij->imax[i]; j++) {
      PetscCall(PetscRandomGetValue(rctx, &a));
      col = (PetscInt)(n * PetscRealPart(a));
      if (col >= low) col += nskip; /* shift col rightward to skip the hole */
      PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
    }
  }
  PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
  PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
  PetscFunctionReturn(0);
}

/* -------------------------------------------------------------------*/
/*
   Function table for the SeqAIJ implementation. The initializer is purely positional:
   the numeric comments give the zero-based slot of the entry that follows them, and a
   NULL leaves that slot without a SeqAIJ-specific routine. Do not reorder entries.
*/
static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
                                       MatGetRow_SeqAIJ,
                                       MatRestoreRow_SeqAIJ,
                                       MatMult_SeqAIJ,
                                       /* 4*/ MatMultAdd_SeqAIJ,
                                       MatMultTranspose_SeqAIJ,
                                       MatMultTransposeAdd_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 10*/ NULL,
                                       MatLUFactor_SeqAIJ,
                                       NULL,
                                       MatSOR_SeqAIJ,
                                       MatTranspose_SeqAIJ,
                                       /* 15*/ MatGetInfo_SeqAIJ,
                                       MatEqual_SeqAIJ,
                                       MatGetDiagonal_SeqAIJ,
                                       MatDiagonalScale_SeqAIJ,
                                       MatNorm_SeqAIJ,
                                       /* 20*/ NULL,
                                       MatAssemblyEnd_SeqAIJ,
                                       MatSetOption_SeqAIJ,
                                       MatZeroEntries_SeqAIJ,
                                       /* 24*/ MatZeroRows_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 29*/ MatSetUp_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 34*/ MatDuplicate_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatILUFactor_SeqAIJ,
                                       NULL,
                                       /* 39*/ MatAXPY_SeqAIJ,
                                       MatCreateSubMatrices_SeqAIJ,
                                       MatIncreaseOverlap_SeqAIJ,
                                       MatGetValues_SeqAIJ,
                                       MatCopy_SeqAIJ,
                                       /* 44*/ MatGetRowMax_SeqAIJ,
                                       MatScale_SeqAIJ,
                                       MatShift_SeqAIJ,
                                       MatDiagonalSet_SeqAIJ,
                                       MatZeroRowsColumns_SeqAIJ,
                                       /* 49*/ MatSetRandom_SeqAIJ,
                                       MatGetRowIJ_SeqAIJ,
                                       MatRestoreRowIJ_SeqAIJ,
                                       MatGetColumnIJ_SeqAIJ,
                                       MatRestoreColumnIJ_SeqAIJ,
                                       /* 54*/ MatFDColoringCreate_SeqXAIJ,
                                       NULL,
                                       NULL,
                                       MatPermute_SeqAIJ,
                                       NULL,
                                       /* 59*/ NULL,
                                       MatDestroy_SeqAIJ,
                                       MatView_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 64*/ NULL,
                                       MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 69*/ MatGetRowMaxAbs_SeqAIJ,
                                       MatGetRowMinAbs_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 74*/ NULL,
                                       MatFDColoringApply_AIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 79*/ MatFindZeroDiagonals_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatLoad_SeqAIJ,
                                       /* 84*/ MatIsSymmetric_SeqAIJ,
                                       MatIsHermitian_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 89*/ NULL,
                                       NULL,
                                       MatMatMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
                                       NULL,
                                       NULL,
                                       MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       /* 99*/ MatProductSetFromOptions_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatConjugate_SeqAIJ,
                                       NULL,
                                       /*104*/ MatSetValuesRow_SeqAIJ,
                                       MatRealPart_SeqAIJ,
                                       MatImaginaryPart_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /*109*/ MatMatSolve_SeqAIJ,
                                       NULL,
                                       MatGetRowMin_SeqAIJ,
                                       NULL,
                                       MatMissingDiagonal_SeqAIJ,
                                       /*114*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /*119*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatGetMultiProcBlock_SeqAIJ,
                                       /*124*/ MatFindNonzeroRows_SeqAIJ,
                                       MatGetColumnReductions_SeqAIJ,
                                       MatInvertBlockDiagonal_SeqAIJ,
                                       MatInvertVariableBlockDiagonal_SeqAIJ,
                                       NULL,
                                       /*129*/ NULL,
                                       NULL,
                                       NULL,
                                       MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
                                       MatTransposeColoringCreate_SeqAIJ,
                                       /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
                                       MatTransColoringApplyDenToSp_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatRARtNumeric_SeqAIJ_SeqAIJ,
                                       /*139*/ NULL,
                                       NULL,
                                       NULL,
                                       MatFDColoringSetUp_SeqXAIJ,
                                       MatFindOffBlockDiagonalEntries_SeqAIJ,
                                       MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
                                       /*145*/ MatDestroySubMatrices_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatCreateGraph_Simple_AIJ,
                                       NULL,
                                       /*150*/ MatTransposeSymbolic_SeqAIJ,
                                       MatEliminateZeros_SeqAIJ};

/*
   MatSeqAIJSetColumnIndices_SeqAIJ - SeqAIJ implementation of MatSeqAIJSetColumnIndices().

   Copies aij->maxnz entries from indices into aij->j, sets aij->nz to maxnz and marks
   every row as full by setting ilen[i] = imax[i]. No validation of indices is done here;
   the caller must supply at least maxnz entries.
*/
PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  PetscInt    i, nz, n;

  PetscFunctionBegin;
  nz = aij->maxnz;
  n  = mat->rmap->n;
  for (i = 0; i < nz; i++) aij->j[i] = indices[i];
  aij->nz = nz;
  for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
  PetscFunctionReturn(0);
}

/*
 * Given a sparse matrix with global column indices, compact it by using a local column space.
3602ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3603ddea5d60SJunchao Zhang */ 3604d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3605d71ae5a4SJacob Faibussowitsch { 3606a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3607*eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3608*eec179cfSJacob Faibussowitsch PetscHashIter tpos; 360925b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 361025b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3611a3bb6f32SFande Kong 3612a3bb6f32SFande Kong PetscFunctionBegin; 3613a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3614a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3615a3bb6f32SFande Kong /* use a table */ 3616*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3617a3bb6f32SFande Kong ec = 0; 361825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 361925b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3620*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3621a3bb6f32SFande Kong if (!data) { 3622a3bb6f32SFande Kong /* one based table */ 3623*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapISetWithMode(gid1_lid1, gid1, ++ec, INSERT_VALUES)); 3624a3bb6f32SFande Kong } 3625a3bb6f32SFande Kong } 3626a3bb6f32SFande Kong /* form array of columns we need */ 36279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3628*eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3629*eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3630*eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3631*eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3632*eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3633a3bb6f32SFande 
Kong gid--; 3634a3bb6f32SFande Kong lid--; 3635a3bb6f32SFande Kong garray[lid] = gid; 3636a3bb6f32SFande Kong } 36379566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3638*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3639*eec179cfSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISetWithMode(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES)); 3640a3bb6f32SFande Kong /* compact out the extra columns in B */ 364125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 364225b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3643*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3644a3bb6f32SFande Kong lid--; 364525b670f0SStefano Zampini jj[i] = lid; 3646a3bb6f32SFande Kong } 36479566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3648*eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36499566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36509566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36519566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3652a3bb6f32SFande Kong PetscFunctionReturn(0); 3653a3bb6f32SFande Kong } 3654a3bb6f32SFande Kong 3655bef8e0ddSBarry Smith /*@ 3656bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3657bef8e0ddSBarry Smith in the matrix. 
3658bef8e0ddSBarry Smith 3659bef8e0ddSBarry Smith Input Parameters: 366011a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3661bef8e0ddSBarry Smith - indices - the column indices 3662bef8e0ddSBarry Smith 366315091d37SBarry Smith Level: advanced 366415091d37SBarry Smith 3665bef8e0ddSBarry Smith Notes: 3666bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3667bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 366811a5261eSBarry Smith of the `MatSetValues()` operation. 3669bef8e0ddSBarry Smith 3670bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 367111a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3672bef8e0ddSBarry Smith 367311a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3674bef8e0ddSBarry Smith 3675b9617806SBarry Smith The indices should start with zero, not one. 3676b9617806SBarry Smith 3677bef8e0ddSBarry Smith @*/ 3678d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3679d71ae5a4SJacob Faibussowitsch { 3680bef8e0ddSBarry Smith PetscFunctionBegin; 36810700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3682dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3683cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3684bef8e0ddSBarry Smith PetscFunctionReturn(0); 3685bef8e0ddSBarry Smith } 3686bef8e0ddSBarry Smith 3687be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3688be6bf707SBarry Smith 3689d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3690d71ae5a4SJacob Faibussowitsch { 3691be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3692d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3693be6bf707SBarry Smith 3694be6bf707SBarry Smith 
PetscFunctionBegin; 369528b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3696be6bf707SBarry Smith 3697be6bf707SBarry Smith /* allocate space for values if not already there */ 36984dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3699be6bf707SBarry Smith 3700be6bf707SBarry Smith /* copy values over */ 37019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 3702be6bf707SBarry Smith PetscFunctionReturn(0); 3703be6bf707SBarry Smith } 3704be6bf707SBarry Smith 3705be6bf707SBarry Smith /*@ 3706be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3707be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3708be6bf707SBarry Smith nonlinear portion. 3709be6bf707SBarry Smith 371011a5261eSBarry Smith Collect on mat 3711be6bf707SBarry Smith 3712be6bf707SBarry Smith Input Parameters: 371311a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3714be6bf707SBarry Smith 371515091d37SBarry Smith Level: advanced 371615091d37SBarry Smith 371711a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3718be6bf707SBarry Smith $ Create Jacobian matrix 3719be6bf707SBarry Smith $ Set linear terms into matrix 3720be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3721be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying 3722be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3723512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3724be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3725be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3726be6bf707SBarry Smith $ In your Jacobian routine 3727be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3728be6bf707SBarry Smith $ Set nonlinear terms in matrix 3729be6bf707SBarry Smith 3730be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3731be6bf707SBarry Smith $ // build linear portion of Jacobian 3732512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3733be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3734be6bf707SBarry Smith $ loop over nonlinear iterations 3735be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3736be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3737be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3738be6bf707SBarry Smith $ Solve linear system with Jacobian 3739be6bf707SBarry Smith $ endloop 3740be6bf707SBarry Smith 3741be6bf707SBarry Smith Notes: 3742be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 374311a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3744be6bf707SBarry Smith calling this routine. 3745be6bf707SBarry Smith 37460c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37470c468ba9SBarry Smith and does not allocated additional space. 
37480c468ba9SBarry Smith 3749db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3750be6bf707SBarry Smith @*/ 3751d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3752d71ae5a4SJacob Faibussowitsch { 3753be6bf707SBarry Smith PetscFunctionBegin; 37540700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 375528b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 375628b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3757cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3758be6bf707SBarry Smith PetscFunctionReturn(0); 3759be6bf707SBarry Smith } 3760be6bf707SBarry Smith 3761d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3762d71ae5a4SJacob Faibussowitsch { 3763be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3764d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3765be6bf707SBarry Smith 3766be6bf707SBarry Smith PetscFunctionBegin; 376728b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 376828b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3769be6bf707SBarry Smith /* copy values over */ 37709566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3771be6bf707SBarry Smith PetscFunctionReturn(0); 3772be6bf707SBarry Smith } 3773be6bf707SBarry Smith 3774be6bf707SBarry Smith /*@ 3775be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3776be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3777be6bf707SBarry Smith nonlinear portion. 

   Collective on mat

  Input Parameters:
.  mat - the matrix (currently only `MATAIJ` matrices support this option)

    Level: advanced

.seealso: `MatStoreValues()`
@*/
PetscErrorCode MatRetrieveValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* same state requirements as MatStoreValues(): assembled and not a factor */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* dispatch to the implementation composed on mat under this name */
  PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
  PetscFunctionReturn(0);
}

/* --------------------------------------------------------------------------------*/
/*@C
   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
   (the default parallel PETSc format).  For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.

   Collective

   Input Parameters:
+  comm - MPI communicator, set to `PETSC_COMM_SELF`
.  m - number of rows
.  n - number of columns
.  nz - number of nonzeros per row (same for all rows)
-  nnz - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

   Output Parameter:
.  A - the matrix

   It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`,
   MatXXXXSetPreallocation() paradigm instead of this routine directly.
   [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`]

   Notes:
   If nnz is given then nz is ignored

   The AIJ format, also called
   compressed row storage, is fully compatible with standard Fortran 77
   storage.  That is, the stored row and column indices can begin at
   either one (as in Fortran) or zero.  See the users' manual for details.

   Specify the preallocated storage with either nz or nnz (not both).
   Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
   allocation.  For large problems you MUST preallocate memory or you
   will get TERRIBLE performance, see the users' manual chapter on matrices.

   By default, this format uses inodes (identical nodes) when possible, to
   improve numerical efficiency of matrix-vector products and solves. We
   search for consecutive rows with the same nonzero structure, thereby
   reusing matrix information to achieve increased efficiency.

   Options Database Keys:
+  -mat_no_inode  - Do not use inodes
-  -mat_inode_limit <limit> - Sets inode limit (max limit=5)

   Level: intermediate

.seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  PetscCall(MatCreate(comm, A));
  /* the same m and n are passed as both the local and the global sizes */
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* the type was just set to MATSEQAIJ, so the SeqAIJ preallocation routine is called directly */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(0);
}

/*@C
   MatSeqAIJSetPreallocation - For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.

   Collective

   Input Parameters:
+  B - The matrix
.  nz - number of nonzeros per row (same for all rows)
-  nnz - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

   Notes:
     If nnz is given then nz is ignored

    The `MATSEQAIJ` format, also called
    compressed row storage, is fully compatible with standard Fortran 77
    storage.  That is, the stored row and column indices can begin at
    either one (as in Fortran) or zero.  See the users' manual for details.

    Specify the preallocated storage with either nz or nnz (not both).
    Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
    allocation.  For large problems you MUST preallocate memory or you
    will get TERRIBLE performance, see the users' manual chapter on matrices.

    You can call `MatGetInfo()` to get information on how effective the preallocation was;
    for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
    You can also run with the option -info and look for messages with the string
    malloc in them to see if additional memory allocation was needed.
3890aa95bbe8SBarry Smith 389111a5261eSBarry Smith Developer Notes: 389211a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3893a96a251dSBarry Smith entries or columns indices 3894a96a251dSBarry Smith 3895273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3896273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3897273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3898273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3899273d9f13SBarry Smith 3900273d9f13SBarry Smith Options Database Keys: 3901698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 390247b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3903273d9f13SBarry Smith 3904273d9f13SBarry Smith Level: intermediate 3905273d9f13SBarry Smith 3906db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3907db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3908273d9f13SBarry Smith @*/ 3909d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3910d71ae5a4SJacob Faibussowitsch { 3911a23d5eceSKris Buschelman PetscFunctionBegin; 39126ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39136ba663aaSJed Brown PetscValidType(B, 1); 3914cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3915a23d5eceSKris Buschelman PetscFunctionReturn(0); 3916a23d5eceSKris Buschelman } 3917a23d5eceSKris Buschelman 3918d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3919d71ae5a4SJacob Faibussowitsch { 3920273d9f13SBarry Smith Mat_SeqAIJ *b; 39212576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 392297f1f81fSBarry Smith PetscInt i; 3923273d9f13SBarry Smith 3924273d9f13SBarry Smith PetscFunctionBegin; 39252576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3926a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3927c461c341SBarry Smith skipallocation = PETSC_TRUE; 3928c461c341SBarry Smith nz = 0; 3929c461c341SBarry Smith } 39309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3932899cda47SBarry Smith 3933435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 393408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3935cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3936d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 393708401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 393808401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3939b73539f3SBarry Smith } 3940b73539f3SBarry Smith } 3941b73539f3SBarry Smith 3942273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39432205254eSKarl Rupp 3944273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3945273d9f13SBarry Smith 3946ab93d7beSBarry Smith if (!skipallocation) { 39474dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3948071fcb05SBarry Smith if (!b->ilen) { 3949071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3951071fcb05SBarry Smith } else { 39529566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39532ee49352SLisandro Dalcin } 39544dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3955273d9f13SBarry Smith if (!nnz) { 3956435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3957c62bd62aSJed Brown else if (nz < 0) nz = 1; 39585d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3959d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3960d0f46423SBarry Smith nz = nz * B->rmap->n; 3961273d9f13SBarry Smith } else { 3962c73702f5SBarry Smith PetscInt64 nz64 = 0; 39639371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39649371c9d4SSatish Balay b->imax[i] = nnz[i]; 39659371c9d4SSatish Balay nz64 += nnz[i]; 39669371c9d4SSatish Balay } 39679566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3968273d9f13SBarry Smith } 3969ab93d7beSBarry Smith 3970273d9f13SBarry Smith /* allocate the matrix space */ 397153dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39729566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 3973396832f4SHong Zhang if (B->structure_only) { 39749566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 39759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 3976396832f4SHong Zhang } else { 39779566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 3978396832f4SHong Zhang } 3979bfeeae90SHong Zhang b->i[0] = 0; 3980ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 3981396832f4SHong Zhang if (B->structure_only) { 3982396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3983396832f4SHong Zhang b->free_a = PETSC_FALSE; 3984396832f4SHong Zhang } else { 3985273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3986e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3987396832f4SHong Zhang } 3988e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3989c461c341SBarry Smith } else { 3990e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3991e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3992c461c341SBarry Smith } 3993273d9f13SBarry Smith 3994846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3995846b4da1SFande Kong /* reserve user-requested sparsity */ 39969566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 3997846b4da1SFande Kong } 3998846b4da1SFande Kong 3999273d9f13SBarry Smith b->nz = 0; 4000273d9f13SBarry Smith b->maxnz = nz; 4001273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40021baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4003cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4004cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40055519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40065519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40075519a089SJose E. Roman */ 40085519a089SJose E. Roman B->nonzerostate++; 4009273d9f13SBarry Smith PetscFunctionReturn(0); 4010273d9f13SBarry Smith } 4011273d9f13SBarry Smith 4012d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4013d71ae5a4SJacob Faibussowitsch { 4014846b4da1SFande Kong Mat_SeqAIJ *a; 4015a5bbaf83SFande Kong PetscInt i; 4016846b4da1SFande Kong 4017846b4da1SFande Kong PetscFunctionBegin; 4018846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 401914d0e64fSAlex Lindsay 402014d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 402114d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 402214d0e64fSAlex Lindsay 4023846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40242c814fdeSFande Kong /* if no saved info, we error out */ 402528b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40262c814fdeSFande Kong 4027aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40282c814fdeSFande Kong 40299566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40309566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4031846b4da1SFande Kong a->i[0] = 0; 4032ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4033846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4034846b4da1SFande Kong a->nz = 0; 4035846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4036846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4037846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4038846b4da1SFande Kong A->assembled = PETSC_FALSE; 4039846b4da1SFande Kong PetscFunctionReturn(0); 4040846b4da1SFande Kong } 4041846b4da1SFande Kong 404258d36128SBarry Smith /*@ 404311a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
sparse sequential matrix in `MATSEQAIJ` format.

   Input Parameters:
+  B - the matrix
.  i - the indices into j for the start of each row (starts with zero)
.  j - the column indices for each row (starts with zero); these must be sorted within each row
-  v - optional values in the matrix

   Level: developer

   Notes:
   The i, j, and v values are COPIED by this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`

   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
   structure will be the union of all the previous nonzero structures.

   Developer Notes:
   An optimization could be added to the implementation where it checks if i and j are identical to the current i and j and
   then just copies the v values directly with `PetscMemcpy()`.

   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40646a9b8d82SBarry Smith 4065db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4066a1661176SMatthew Knepley @*/ 4067d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4068d71ae5a4SJacob Faibussowitsch { 4069a1661176SMatthew Knepley PetscFunctionBegin; 40700700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 40716ba663aaSJed Brown PetscValidType(B, 1); 4072cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4073a1661176SMatthew Knepley PetscFunctionReturn(0); 4074a1661176SMatthew Knepley } 4075a1661176SMatthew Knepley 4076d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4077d71ae5a4SJacob Faibussowitsch { 4078a1661176SMatthew Knepley PetscInt i; 4079a1661176SMatthew Knepley PetscInt m, n; 4080a1661176SMatthew Knepley PetscInt nz; 40816a9b8d82SBarry Smith PetscInt *nnz; 4082a1661176SMatthew Knepley 4083a1661176SMatthew Knepley PetscFunctionBegin; 4084aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4085779a8d59SSatish Balay 40869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 40879566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4088779a8d59SSatish Balay 40899566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 40909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4091a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4092b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 409308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4094a1661176SMatthew Knepley nnz[i] = nz; 4095a1661176SMatthew Knepley } 40969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 40979566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4098a1661176SMatthew Knepley 409948a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4100a1661176SMatthew Knepley 41019566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41029566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4103a1661176SMatthew Knepley 41049566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4105a1661176SMatthew Knepley PetscFunctionReturn(0); 4106a1661176SMatthew Knepley } 4107a1661176SMatthew Knepley 4108ad7e164aSPierre Jolivet /*@ 4109ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4110ad7e164aSPierre Jolivet 4111ad7e164aSPierre Jolivet Input Parameters: 4112ad7e164aSPierre Jolivet + A - left-hand side matrix 4113ad7e164aSPierre Jolivet . B - right-hand side matrix 411411a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4115ad7e164aSPierre Jolivet 4116ad7e164aSPierre Jolivet Output Parameter: 4117ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4118ad7e164aSPierre Jolivet 4119ad7e164aSPierre Jolivet Level: intermediate 4120ad7e164aSPierre Jolivet 412111a5261eSBarry Smith Note: 412211a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4123ad7e164aSPierre Jolivet 4124db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4125ad7e164aSPierre Jolivet @*/ 4126d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4127d71ae5a4SJacob Faibussowitsch { 4128ad7e164aSPierre Jolivet PetscFunctionBegin; 4129ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4130ad7e164aSPierre Jolivet PetscValidType(A, 1); 4131ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4132ad7e164aSPierre Jolivet PetscValidType(B, 2); 4133ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4134ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4135ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4136ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4137ad7e164aSPierre Jolivet } 4138cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4139ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4140ad7e164aSPierre Jolivet } 4141ad7e164aSPierre Jolivet 4142d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4143d71ae5a4SJacob Faibussowitsch { 4144ad7e164aSPierre Jolivet Mat newmat; 4145ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4146ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4147ad7e164aSPierre Jolivet PetscScalar *v; 4148fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4149ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4150ad7e164aSPierre Jolivet PetscBool flg; 4151ad7e164aSPierre Jolivet 4152ad7e164aSPierre Jolivet PetscFunctionBegin; 415328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 415428b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 415528b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 415628b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41579566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 415828b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4159aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4160ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41619566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41629566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41639566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41649566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4165ad7e164aSPierre Jolivet i[0] = 0; 4166ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4167ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4168ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4169ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4170ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4171ad7e164aSPierre Jolivet } 4172ad7e164aSPierre Jolivet } 4173ad7e164aSPierre Jolivet } 41749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4175ad7e164aSPierre Jolivet *C = newmat; 41769566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4177ad7e164aSPierre Jolivet nnz = 0; 4178ad7e164aSPierre Jolivet } 41799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 41809566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 41819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4182ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4183ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4184ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4185ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4186ad7e164aSPierre Jolivet } 4187ad7e164aSPierre Jolivet } 4188ad7e164aSPierre Jolivet } 41899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 41909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 41919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4192ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4193ad7e164aSPierre Jolivet } 4194ad7e164aSPierre Jolivet 4195c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4196af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4197170fe5c8SBarry Smith 4198170fe5c8SBarry Smith /* 4199170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4200170fe5c8SBarry Smith 4201170fe5c8SBarry Smith n p p 42022da392ccSBarry Smith [ ] [ ] [ ] 42032da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42042da392ccSBarry Smith [ ] [ ] [ ] 4205170fe5c8SBarry Smith 4206170fe5c8SBarry Smith */ 4207d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4208d71ae5a4SJacob Faibussowitsch { 4209170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4210170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4211170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 421286214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4213170fe5c8SBarry Smith const PetscInt *ii, *idx; 4214170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4215170fe5c8SBarry Smith PetscScalar *c, *c_q; 421686214ceeSStefano Zampini PetscInt clda = sub_c->lda; 421786214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4218170fe5c8SBarry Smith 4219170fe5c8SBarry Smith PetscFunctionBegin; 4220d0f46423SBarry Smith m = A->rmap->n; 4221d0f46423SBarry Smith n = A->cmap->n; 4222d0f46423SBarry Smith p = B->cmap->n; 4223170fe5c8SBarry Smith a = sub_a->v; 4224170fe5c8SBarry Smith b = sub_b->a; 4225170fe5c8SBarry Smith c = sub_c->v; 422686214ceeSStefano Zampini if (clda == m) { 42279566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 422886214ceeSStefano Zampini } else { 422986214ceeSStefano Zampini for (j = 0; j < p; j++) 42309371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 423186214ceeSStefano Zampini } 4232170fe5c8SBarry Smith ii = sub_b->i; 4233170fe5c8SBarry Smith idx = sub_b->j; 4234170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4235170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4236170fe5c8SBarry Smith while (q-- > 0) { 423786214ceeSStefano Zampini c_q = c + clda * (*idx); 423886214ceeSStefano Zampini a_q = a + alda * i; 4239854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4240170fe5c8SBarry Smith idx++; 4241170fe5c8SBarry Smith b++; 4242170fe5c8SBarry Smith } 4243170fe5c8SBarry Smith } 4244170fe5c8SBarry Smith PetscFunctionReturn(0); 4245170fe5c8SBarry Smith } 4246170fe5c8SBarry Smith 4247d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4248d71ae5a4SJacob Faibussowitsch { 4249d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 425086214ceeSStefano Zampini PetscBool cisdense; 4251170fe5c8SBarry Smith 4252170fe5c8SBarry Smith PetscFunctionBegin; 425308401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42549566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42559566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 42569566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 425748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42589566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4259d73949e8SHong Zhang 42604222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4261170fe5c8SBarry Smith PetscFunctionReturn(0); 4262170fe5c8SBarry Smith } 4263170fe5c8SBarry Smith 4264170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42650bad9183SKris Buschelman /*MC 4266fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42670bad9183SKris Buschelman based on compressed sparse row format. 42680bad9183SKris Buschelman 42690bad9183SKris Buschelman Options Database Keys: 42700bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 42710bad9183SKris Buschelman 42720bad9183SKris Buschelman Level: beginner 42730bad9183SKris Buschelman 42740cd7f59aSBarry Smith Notes: 427511a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 42760cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 42770cd7f59aSBarry Smith in the matrix 42780cd7f59aSBarry Smith 427911a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This type also automatically switches over to use inodes when
   enough exist.
4303ccd284c7SBarry Smith 4304ccd284c7SBarry Smith Level: beginner 4305ccd284c7SBarry Smith 4306db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4307ccd284c7SBarry Smith M*/ 4308ccd284c7SBarry Smith 4309ccd284c7SBarry Smith /*MC 4310ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4311ccd284c7SBarry Smith 431211a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 431311a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 431411a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4315ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4316ccd284c7SBarry Smith the above preallocation routines for simplicity. 4317ccd284c7SBarry Smith 4318ccd284c7SBarry Smith Options Database Keys: 431911a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4320ccd284c7SBarry Smith 4321ccd284c7SBarry Smith Level: beginner 4322ccd284c7SBarry Smith 4323c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4324ccd284c7SBarry Smith M*/ 4325ccd284c7SBarry Smith 43267906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43277906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43287906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43297906f579SHong Zhang #endif 4330d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4331d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4332d24d4204SJose E. 
Roman #endif 43337906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43347906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43357906f579SHong Zhang #endif 43367906f579SHong Zhang 4337d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4338c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43394222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43407906f579SHong Zhang 43418c778c55SBarry Smith /*@C 434211a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43438c778c55SBarry Smith 43448c778c55SBarry Smith Not Collective 43458c778c55SBarry Smith 43468c778c55SBarry Smith Input Parameter: 434711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43488c778c55SBarry Smith 43498c778c55SBarry Smith Output Parameter: 43508c778c55SBarry Smith . 
array - pointer to the data 43518c778c55SBarry Smith 43528c778c55SBarry Smith Level: intermediate 43538c778c55SBarry Smith 4354db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43558c778c55SBarry Smith @*/ 4356d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4357d71ae5a4SJacob Faibussowitsch { 4358d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43598c778c55SBarry Smith 43608c778c55SBarry Smith PetscFunctionBegin; 4361d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43629566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4363d67d9f35SJunchao Zhang } else { 4364d67d9f35SJunchao Zhang *array = aij->a; 4365d67d9f35SJunchao Zhang } 4366d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4367d67d9f35SJunchao Zhang } 4368d67d9f35SJunchao Zhang 4369d67d9f35SJunchao Zhang /*@C 437011a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4371d67d9f35SJunchao Zhang 4372d67d9f35SJunchao Zhang Not Collective 4373d67d9f35SJunchao Zhang 4374d67d9f35SJunchao Zhang Input Parameters: 437511a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4376d67d9f35SJunchao Zhang - array - pointer to the data 4377d67d9f35SJunchao Zhang 4378d67d9f35SJunchao Zhang Level: intermediate 4379d67d9f35SJunchao Zhang 4380db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4381d67d9f35SJunchao Zhang @*/ 4382d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4383d71ae5a4SJacob Faibussowitsch { 4384d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4385d67d9f35SJunchao Zhang 4386d67d9f35SJunchao Zhang PetscFunctionBegin; 4387d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 43889566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4389d67d9f35SJunchao Zhang } else { 4390d67d9f35SJunchao 
Zhang *array = NULL; 4391d67d9f35SJunchao Zhang } 43929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 43939566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 43948c778c55SBarry Smith PetscFunctionReturn(0); 43958c778c55SBarry Smith } 43968c778c55SBarry Smith 439721e72a00SBarry Smith /*@C 439811a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 43998f1ea47aSStefano Zampini 44008f1ea47aSStefano Zampini Not Collective 44018f1ea47aSStefano Zampini 44028f1ea47aSStefano Zampini Input Parameter: 440311a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44048f1ea47aSStefano Zampini 44058f1ea47aSStefano Zampini Output Parameter: 44068f1ea47aSStefano Zampini . array - pointer to the data 44078f1ea47aSStefano Zampini 44088f1ea47aSStefano Zampini Level: intermediate 44098f1ea47aSStefano Zampini 4410db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44118f1ea47aSStefano Zampini @*/ 4412d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4413d71ae5a4SJacob Faibussowitsch { 4414d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44158f1ea47aSStefano Zampini 44168f1ea47aSStefano Zampini PetscFunctionBegin; 4417d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44189566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4419d67d9f35SJunchao Zhang } else { 4420d67d9f35SJunchao Zhang *array = aij->a; 4421d67d9f35SJunchao Zhang } 44228f1ea47aSStefano Zampini PetscFunctionReturn(0); 44238f1ea47aSStefano Zampini } 44248f1ea47aSStefano Zampini 44258f1ea47aSStefano Zampini /*@C 442611a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44278f1ea47aSStefano Zampini 44288f1ea47aSStefano Zampini Not Collective 44298f1ea47aSStefano Zampini 44308f1ea47aSStefano Zampini Input 
Parameter: 443111a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44328f1ea47aSStefano Zampini 44338f1ea47aSStefano Zampini Output Parameter: 44348f1ea47aSStefano Zampini . array - pointer to the data 44358f1ea47aSStefano Zampini 44368f1ea47aSStefano Zampini Level: intermediate 44378f1ea47aSStefano Zampini 4438db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44398f1ea47aSStefano Zampini @*/ 4440d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4441d71ae5a4SJacob Faibussowitsch { 4442d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44438f1ea47aSStefano Zampini 44448f1ea47aSStefano Zampini PetscFunctionBegin; 4445d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44469566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4447d67d9f35SJunchao Zhang } else { 4448d67d9f35SJunchao Zhang *array = NULL; 4449d67d9f35SJunchao Zhang } 4450d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4451d67d9f35SJunchao Zhang } 4452d67d9f35SJunchao Zhang 4453d67d9f35SJunchao Zhang /*@C 445411a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4455d67d9f35SJunchao Zhang 4456d67d9f35SJunchao Zhang Not Collective 4457d67d9f35SJunchao Zhang 4458d67d9f35SJunchao Zhang Input Parameter: 445911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4460d67d9f35SJunchao Zhang 4461d67d9f35SJunchao Zhang Output Parameter: 4462d67d9f35SJunchao Zhang . 
array - pointer to the data 4463d67d9f35SJunchao Zhang 4464d67d9f35SJunchao Zhang Level: intermediate 4465d67d9f35SJunchao Zhang 4466db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4467d67d9f35SJunchao Zhang @*/ 4468d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4469d71ae5a4SJacob Faibussowitsch { 4470d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4471d67d9f35SJunchao Zhang 4472d67d9f35SJunchao Zhang PetscFunctionBegin; 4473d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 44749566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4475d67d9f35SJunchao Zhang } else { 4476d67d9f35SJunchao Zhang *array = aij->a; 4477d67d9f35SJunchao Zhang } 44789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44799566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4480d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4481d67d9f35SJunchao Zhang } 4482d67d9f35SJunchao Zhang 4483d67d9f35SJunchao Zhang /*@C 4484d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4485d67d9f35SJunchao Zhang 4486d67d9f35SJunchao Zhang Not Collective 4487d67d9f35SJunchao Zhang 4488d67d9f35SJunchao Zhang Input Parameter: 4489d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4490d67d9f35SJunchao Zhang 4491d67d9f35SJunchao Zhang Output Parameter: 4492d67d9f35SJunchao Zhang . 
array - pointer to the data 4493d67d9f35SJunchao Zhang 4494d67d9f35SJunchao Zhang Level: intermediate 4495d67d9f35SJunchao Zhang 4496db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4497d67d9f35SJunchao Zhang @*/ 4498d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4499d71ae5a4SJacob Faibussowitsch { 4500d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4501d67d9f35SJunchao Zhang 4502d67d9f35SJunchao Zhang PetscFunctionBegin; 4503d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45049566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4505d67d9f35SJunchao Zhang } else { 4506d67d9f35SJunchao Zhang *array = NULL; 4507d67d9f35SJunchao Zhang } 45088f1ea47aSStefano Zampini PetscFunctionReturn(0); 45098f1ea47aSStefano Zampini } 45108f1ea47aSStefano Zampini 45118f1ea47aSStefano Zampini /*@C 451211a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45137ee59b9bSJunchao Zhang 45147ee59b9bSJunchao Zhang Not Collective 45157ee59b9bSJunchao Zhang 45167ee59b9bSJunchao Zhang Input Parameter: 451711a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45187ee59b9bSJunchao Zhang 45197ee59b9bSJunchao Zhang Output Parameters: 45207ee59b9bSJunchao Zhang + i - row map array of the matrix 45217ee59b9bSJunchao Zhang . j - column index array of the matrix 45227ee59b9bSJunchao Zhang . a - data array of the matrix 45237ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45247ee59b9bSJunchao Zhang 45257ee59b9bSJunchao Zhang Notes: 45267ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45277ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45287ee59b9bSJunchao Zhang 45297ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45307ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45317ee59b9bSJunchao Zhang 45327ee59b9bSJunchao Zhang Level: Developer 45337ee59b9bSJunchao Zhang 4534db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45357ee59b9bSJunchao Zhang @*/ 4536d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4537d71ae5a4SJacob Faibussowitsch { 45387ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45397ee59b9bSJunchao Zhang 45407ee59b9bSJunchao Zhang PetscFunctionBegin; 45417ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45427ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45437ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45447ee59b9bSJunchao Zhang } else { 45457ee59b9bSJunchao Zhang if (i) *i = aij->i; 45467ee59b9bSJunchao Zhang if (j) *j = aij->j; 45477ee59b9bSJunchao Zhang if (a) *a = aij->a; 45487ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45497ee59b9bSJunchao Zhang } 45507ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45517ee59b9bSJunchao Zhang } 45527ee59b9bSJunchao Zhang 45537ee59b9bSJunchao Zhang /*@C 455421e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 455521e72a00SBarry Smith 455621e72a00SBarry Smith Not Collective 455721e72a00SBarry Smith 455821e72a00SBarry Smith Input Parameter: 455911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 456021e72a00SBarry Smith 456121e72a00SBarry Smith Output Parameter: 456221e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 456321e72a00SBarry Smith 456421e72a00SBarry Smith Level: intermediate 456521e72a00SBarry Smith 4566db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 456721e72a00SBarry Smith @*/ 4568d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4569d71ae5a4SJacob Faibussowitsch { 457021e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 457121e72a00SBarry Smith 457221e72a00SBarry Smith PetscFunctionBegin; 457321e72a00SBarry Smith *nz = aij->rmax; 457421e72a00SBarry Smith PetscFunctionReturn(0); 457521e72a00SBarry Smith } 457621e72a00SBarry Smith 4577d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4578d71ae5a4SJacob Faibussowitsch { 4579394ed5ebSJunchao Zhang MPI_Comm comm; 4580394ed5ebSJunchao Zhang PetscInt *i, *j; 4581394ed5ebSJunchao Zhang PetscInt M, N, row; 4582394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4583394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4584394ed5ebSJunchao Zhang PetscInt *Aj; 4585394ed5ebSJunchao Zhang PetscScalar *Aa; 4586cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4587cbc6b225SStefano Zampini MatType rtype; 4588394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4589394ed5ebSJunchao Zhang 4590394ed5ebSJunchao Zhang PetscFunctionBegin; 45919566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 45929566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 45939566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4594e8729f6fSJunchao Zhang i = coo_i; 4595e8729f6fSJunchao Zhang j = coo_j; 45969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4597394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4598394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4599394ed5ebSJunchao Zhang perm[k] = k; 4600394ed5ebSJunchao Zhang } 4601394ed5ebSJunchao Zhang 4602394ed5ebSJunchao Zhang /* Sort by row */ 46039566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46049371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46059371c9d4SSatish Balay if (i[k] >= 0) break; 46069371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4607394ed5ebSJunchao Zhang nneg = k; 46089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4609394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4610394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4611394ed5ebSJunchao Zhang 46129566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4614394ed5ebSJunchao Zhang 4615394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4616394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4617394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4618394ed5ebSJunchao Zhang while (k < coo_n) { 4619394ed5ebSJunchao Zhang row = i[k]; 4620394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4621394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4622394ed5ebSJunchao Zhang end = k; 46239566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4624394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4625394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4626394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4627394ed5ebSJunchao Zhang Ai[row] = 1; 4628394ed5ebSJunchao Zhang nnz++; 4629394ed5ebSJunchao Zhang 4630394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4631394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4632394ed5ebSJunchao Zhang q++; 4633394ed5ebSJunchao Zhang jmap[q] = 1; 4634394ed5ebSJunchao Zhang Aj[q] = j[p]; 4635394ed5ebSJunchao Zhang Ai[row]++; 4636394ed5ebSJunchao Zhang nnz++; 4637394ed5ebSJunchao Zhang } else { 4638394ed5ebSJunchao Zhang jmap[q]++; 4639394ed5ebSJunchao Zhang } 4640394ed5ebSJunchao Zhang } 4641394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4642394ed5ebSJunchao Zhang } 4643394ed5ebSJunchao Zhang 4644394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4645394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4646394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4647394ed5ebSJunchao Zhang jmap[0] = 0; 4648394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4649394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4650394ed5ebSJunchao Zhang PetscCount *jmap_new; 4651394ed5ebSJunchao Zhang PetscInt *Aj_new; 4652394ed5ebSJunchao Zhang 46539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46549566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46559566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4656394ed5ebSJunchao Zhang jmap = jmap_new; 4657394ed5ebSJunchao Zhang 46589566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46599566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 46609566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4661394ed5ebSJunchao Zhang Aj = Aj_new; 4662394ed5ebSJunchao Zhang } 4663394ed5ebSJunchao Zhang 
4664394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4665394ed5ebSJunchao Zhang PetscCount *perm_new; 4666cbc6b225SStefano Zampini 46679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 46689566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 46699566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4670394ed5ebSJunchao Zhang perm = perm_new; 4671394ed5ebSJunchao Zhang } 4672394ed5ebSJunchao Zhang 46739566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 46749566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 46759566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4676394ed5ebSJunchao Zhang 4677394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4678394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4679394ed5ebSJunchao Zhang /* Record COO fields */ 4680394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4681394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4682394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4683394ed5ebSJunchao Zhang seqaij->perm = perm; 4684394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4685394ed5ebSJunchao Zhang } 4686394ed5ebSJunchao Zhang 4687d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4688d71ae5a4SJacob Faibussowitsch { 4689394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4690394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4691394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4692394ed5ebSJunchao Zhang PetscScalar *Aa; 
4693394ed5ebSJunchao Zhang 4694394ed5ebSJunchao Zhang PetscFunctionBegin; 46959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4696394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4697b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4698b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4699b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4700394ed5ebSJunchao Zhang } 47019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4702394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4703394ed5ebSJunchao Zhang } 4704394ed5ebSJunchao Zhang 470534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47065063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 470702fe1965SBarry Smith #endif 47083d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47095063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47103d0639e7SStefano Zampini #endif 471102fe1965SBarry Smith 4712d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4713d71ae5a4SJacob Faibussowitsch { 4714273d9f13SBarry Smith Mat_SeqAIJ *b; 471538baddfdSBarry Smith PetscMPIInt size; 4716273d9f13SBarry Smith 4717273d9f13SBarry Smith PetscFunctionBegin; 47189566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 471908401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4720273d9f13SBarry Smith 47214dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47222205254eSKarl Rupp 4723b0a32e0cSBarry Smith B->data = (void *)b; 47242205254eSKarl Rupp 47259566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4726071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47272205254eSKarl Rupp 
4728f4259b30SLisandro Dalcin b->row = NULL; 4729f4259b30SLisandro Dalcin b->col = NULL; 4730f4259b30SLisandro Dalcin b->icol = NULL; 4731b810aeb4SBarry Smith b->reallocs = 0; 473236db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4733f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4734416022c9SBarry Smith b->nonew = 0; 4735f4259b30SLisandro Dalcin b->diag = NULL; 4736f4259b30SLisandro Dalcin b->solve_work = NULL; 4737f4259b30SLisandro Dalcin B->spptr = NULL; 4738f4259b30SLisandro Dalcin b->saved_values = NULL; 4739f4259b30SLisandro Dalcin b->idiag = NULL; 4740f4259b30SLisandro Dalcin b->mdiag = NULL; 4741f4259b30SLisandro Dalcin b->ssor_work = NULL; 474271f1c65dSBarry Smith b->omega = 1.0; 474371f1c65dSBarry Smith b->fshift = 0.0; 474471f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4745bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4746a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 474717ab2063SBarry Smith 47489566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4749d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 47509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 47519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4752b3866ffcSBarry Smith #endif 47539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 47549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 47559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 47569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 
47579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 47589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 47599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 47609779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 47619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4762191b95cbSRichard Tran Mills #endif 476334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 47659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 476702fe1965SBarry Smith #endif 47683d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 47703d0639e7SStefano Zampini #endif 47719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4772af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 47739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4774af8000cdSHong Zhang #endif 4775d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 47769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4777d24d4204SJose E. Roman #endif 477863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 47799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 47809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 478163c07aadSStefano Zampini #endif 47829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 47839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 47849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 47859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 47869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 47879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 47889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 47899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 47909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 47919566063dSJacob 
Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 47929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 47959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 47969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 47979566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 47989566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 47999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48003a40ed3dSBarry Smith PetscFunctionReturn(0); 480117ab2063SBarry Smith } 480217ab2063SBarry Smith 4803b24902e0SBarry Smith /* 48043893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4805b24902e0SBarry Smith */ 4806d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4807d71ae5a4SJacob Faibussowitsch { 48082a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4809071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 481017ab2063SBarry Smith 48113a40ed3dSBarry Smith PetscFunctionBegin; 4812aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4813273d9f13SBarry Smith 4814d5f3da31SBarry Smith C->factortype = A->factortype; 4815f4259b30SLisandro Dalcin c->row = NULL; 4816f4259b30SLisandro Dalcin c->col = NULL; 4817f4259b30SLisandro Dalcin c->icol = NULL; 48186ad4291fSHong Zhang c->reallocs = 0; 481917ab2063SBarry Smith 482069272f91SPierre Jolivet C->assembled = A->assembled; 482169272f91SPierre Jolivet C->preallocated = A->preallocated; 482217ab2063SBarry Smith 482369272f91SPierre Jolivet if (A->preallocated) { 48249566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48259566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4826eec197d1SBarry Smith 48279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48289566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48309566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 483117ab2063SBarry Smith 483217ab2063SBarry Smith /* allocate the matrix space */ 4833f77e22a1SHong Zhang if (mallocmatspace) { 48349566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48352205254eSKarl Rupp 4836f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48372205254eSKarl Rupp 48389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 483917ab2063SBarry Smith if (m > 0) { 48409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4841be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48422e5835c6SStefano Zampini const PetscScalar *aa; 48432e5835c6SStefano Zampini 48449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48459566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
4847be6bf707SBarry Smith } else { 48489566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 484917ab2063SBarry Smith } 485008480c60SBarry Smith } 4851f77e22a1SHong Zhang } 485217ab2063SBarry Smith 48536ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4854416022c9SBarry Smith c->roworiented = a->roworiented; 4855416022c9SBarry Smith c->nonew = a->nonew; 4856416022c9SBarry Smith if (a->diag) { 48579566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 48589566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4859071fcb05SBarry Smith } else c->diag = NULL; 48602205254eSKarl Rupp 4861f4259b30SLisandro Dalcin c->solve_work = NULL; 4862f4259b30SLisandro Dalcin c->saved_values = NULL; 4863f4259b30SLisandro Dalcin c->idiag = NULL; 4864f4259b30SLisandro Dalcin c->ssor_work = NULL; 4865a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4866e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4867e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 48686ad4291fSHong Zhang 4869893ad86cSHong Zhang c->rmax = a->rmax; 4870416022c9SBarry Smith c->nz = a->nz; 48718ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4872754ec7b1SSatish Balay 48736ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 48746ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4875cd6b891eSBarry Smith if (a->compressedrow.use) { 48766ad4291fSHong Zhang i = a->compressedrow.nrows; 48779566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 48789566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 48799566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 488027ea64f8SHong Zhang } else { 488127ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 48820298fd71SBarry Smith c->compressedrow.i = 
NULL; 48830298fd71SBarry Smith c->compressedrow.rindex = NULL; 48846ad4291fSHong Zhang } 4885ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4886e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 48874846f1f5SKris Buschelman 48889566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 488969272f91SPierre Jolivet } 48909566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 48913a40ed3dSBarry Smith PetscFunctionReturn(0); 489217ab2063SBarry Smith } 489317ab2063SBarry Smith 4894d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4895d71ae5a4SJacob Faibussowitsch { 4896b24902e0SBarry Smith PetscFunctionBegin; 48979566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 48989566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 489948a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49009566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49019566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4902b24902e0SBarry Smith PetscFunctionReturn(0); 4903b24902e0SBarry Smith } 4904b24902e0SBarry Smith 4905d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4906d71ae5a4SJacob Faibussowitsch { 490752f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 490852f91c60SVaclav Hapla 490952f91c60SVaclav Hapla PetscFunctionBegin; 491052f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 491152f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4912c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49139566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 
49149566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49159566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 491652f91c60SVaclav Hapla if (isbinary) { 49179566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 491852f91c60SVaclav Hapla } else if (ishdf5) { 491952f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49209566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 492152f91c60SVaclav Hapla #else 492252f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 492352f91c60SVaclav Hapla #endif 492452f91c60SVaclav Hapla } else { 492598921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 492652f91c60SVaclav Hapla } 492752f91c60SVaclav Hapla PetscFunctionReturn(0); 492852f91c60SVaclav Hapla } 492952f91c60SVaclav Hapla 4930d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4931d71ae5a4SJacob Faibussowitsch { 49323ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49333ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4934fbdbba38SShri Abhyankar 4935fbdbba38SShri Abhyankar PetscFunctionBegin; 49369566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4937bbead8a2SBarry Smith 49383ea6fe3dSLisandro Dalcin /* read in matrix header */ 49399566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 494008401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49419371c9d4SSatish Balay M = header[1]; 
49429371c9d4SSatish Balay N = header[2]; 49439371c9d4SSatish Balay nz = header[3]; 494408401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 494508401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 494608401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4947fbdbba38SShri Abhyankar 49483ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49499566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49503ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49513ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49523ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49533ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49543ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49559566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49569566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49573ea6fe3dSLisandro Dalcin 49583ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49599566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4960aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49613ea6fe3dSLisandro Dalcin 4962fbdbba38SShri Abhyankar /* read in row lengths */ 49639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 49649566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 
49653ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 49669371c9d4SSatish Balay sum = 0; 49679371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 496808401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 49693ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 49709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 49719566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4972aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49733ea6fe3dSLisandro Dalcin /* store row lengths */ 49749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 49759566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 4976fbdbba38SShri Abhyankar 49773ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 49789371c9d4SSatish Balay a->i[0] = 0; 49799371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 49803ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 49819566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 49823ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 49839566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 4984fbdbba38SShri Abhyankar 49859566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 49869566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 4987fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4988fbdbba38SShri Abhyankar } 4989fbdbba38SShri Abhyankar 4990d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 4991d71ae5a4SJacob Faibussowitsch { 49927264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 4993fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4994eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4995eeffb40dSHong Zhang PetscInt k; 4996eeffb40dSHong Zhang #endif 49977264ac53SSatish Balay 49983a40ed3dSBarry Smith PetscFunctionBegin; 4999bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5000d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5001ca44d042SBarry Smith *flg = PETSC_FALSE; 5002ca44d042SBarry Smith PetscFunctionReturn(0); 5003bcd2baecSBarry Smith } 50047264ac53SSatish Balay 50057264ac53SSatish Balay /* if the a->i are the same */ 50069566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5007abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50087264ac53SSatish Balay 50097264ac53SSatish Balay /* if a->j are the same */ 50109566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5011abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5012bcd2baecSBarry Smith 50139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5015bcd2baecSBarry Smith /* if a->a are the same */ 5016eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5017eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5018fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5019eeffb40dSHong Zhang *flg = PETSC_FALSE; 50203a40ed3dSBarry Smith PetscFunctionReturn(0); 5021eeffb40dSHong Zhang } 5022eeffb40dSHong Zhang } 5023eeffb40dSHong Zhang #else 50249566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5025eeffb40dSHong Zhang #endif 50269566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5028eeffb40dSHong Zhang PetscFunctionReturn(0); 50297264ac53SSatish Balay } 503036db0b34SBarry Smith 503105869f15SSatish Balay /*@ 503211a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 503336db0b34SBarry Smith provided by the user. 503436db0b34SBarry Smith 5035d083f849SBarry Smith Collective 503636db0b34SBarry Smith 503736db0b34SBarry Smith Input Parameters: 503836db0b34SBarry Smith + comm - must be an MPI communicator of size 1 503936db0b34SBarry Smith . m - number of rows 504036db0b34SBarry Smith . n - number of columns 5041483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 504236db0b34SBarry Smith . j - column indices 504336db0b34SBarry Smith - a - matrix values 504436db0b34SBarry Smith 504536db0b34SBarry Smith Output Parameter: 504636db0b34SBarry Smith . mat - the matrix 504736db0b34SBarry Smith 504836db0b34SBarry Smith Level: intermediate 504936db0b34SBarry Smith 505036db0b34SBarry Smith Notes: 50510551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5052292fb18eSBarry Smith once the matrix is destroyed and not before 505336db0b34SBarry Smith 505436db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 505536db0b34SBarry Smith 5056bfeeae90SHong Zhang The i and j indices are 0 based 505736db0b34SBarry Smith 5058a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5059a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50608eef79e4SBarry Smith as shown 5061a4552177SSatish Balay 50628eef79e4SBarry Smith $ 1 0 0 50638eef79e4SBarry Smith $ 2 0 3 50648eef79e4SBarry Smith $ 4 5 6 50658eef79e4SBarry Smith $ 50668eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 50678eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 50688eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5069a4552177SSatish Balay 5070db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 507136db0b34SBarry Smith @*/ 5072d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5073d71ae5a4SJacob Faibussowitsch { 5074cbcfb4deSHong Zhang PetscInt ii; 507536db0b34SBarry Smith Mat_SeqAIJ *aij; 5076cbcfb4deSHong Zhang PetscInt jj; 507736db0b34SBarry Smith 507836db0b34SBarry Smith PetscFunctionBegin; 5079aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 50809566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 50819566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 50829566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 50839566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 50849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5085ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 50869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 50879566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5088ab93d7beSBarry Smith 508936db0b34SBarry Smith aij->i = i; 509036db0b34SBarry Smith aij->j = j; 509136db0b34SBarry Smith aij->a = a; 509236db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
509336db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5094e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5095e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 509636db0b34SBarry Smith 5097cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 509836db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 509976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5100aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51019985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 510208401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 510308401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51049985e31cSBarry Smith } 510536db0b34SBarry Smith } 510676bd3646SJed Brown } 510776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 510836db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 510908401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5110aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 511136db0b34SBarry Smith } 511276bd3646SJed Brown } 511336db0b34SBarry Smith 51149566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51159566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 511636db0b34SBarry Smith PetscFunctionReturn(0); 511736db0b34SBarry Smith } 5118cbc6b225SStefano Zampini 5119f62e3866SBarry Smith /*@ 512011a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51218a0b0e6bSVictor Minden provided by the user. 51228a0b0e6bSVictor Minden 5123d083f849SBarry Smith Collective 51248a0b0e6bSVictor Minden 51258a0b0e6bSVictor Minden Input Parameters: 51268a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51278a0b0e6bSVictor Minden . m - number of rows 51288a0b0e6bSVictor Minden . n - number of columns 51298a0b0e6bSVictor Minden . i - row indices 51308a0b0e6bSVictor Minden . j - column indices 51311230e6d1SVictor Minden . a - matrix values 51321230e6d1SVictor Minden . nz - number of nonzeros 513311a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51348a0b0e6bSVictor Minden 51358a0b0e6bSVictor Minden Output Parameter: 51368a0b0e6bSVictor Minden . 
mat - the matrix 51378a0b0e6bSVictor Minden 51388a0b0e6bSVictor Minden Level: intermediate 51398a0b0e6bSVictor Minden 5140f62e3866SBarry Smith Example: 5141f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51429e99939fSJunchao Zhang .vb 51438a0b0e6bSVictor Minden 1 0 0 51448a0b0e6bSVictor Minden 2 0 3 51458a0b0e6bSVictor Minden 4 5 6 51468a0b0e6bSVictor Minden 51478a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51488a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51498a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51509e99939fSJunchao Zhang .ve 5151d7547e51SJunchao Zhang Notes: 5152d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5153d7547e51SJunchao Zhang and are particularly useful in iterative applications. 51548a0b0e6bSVictor Minden 5155d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 51568a0b0e6bSVictor Minden @*/ 5157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5158d71ae5a4SJacob Faibussowitsch { 5159d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 51608a0b0e6bSVictor Minden 51618a0b0e6bSVictor Minden PetscFunctionBegin; 51629566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5163ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 51649566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51659566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51669566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 51681230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 51691230e6d1SVictor Minden if (idx) { 51701230e6d1SVictor Minden row = i[ii] - 1; 51711230e6d1SVictor Minden col = j[ii] - 1; 51721230e6d1SVictor Minden } else { 51731230e6d1SVictor Minden row = i[ii]; 51741230e6d1SVictor Minden col = j[ii]; 51758a0b0e6bSVictor Minden } 51769566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 51778a0b0e6bSVictor Minden } 51789566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 51799566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 51809566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 51818a0b0e6bSVictor Minden PetscFunctionReturn(0); 51828a0b0e6bSVictor Minden } 518336db0b34SBarry Smith 5184d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5185d71ae5a4SJacob Faibussowitsch { 5186acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5187acf2f550SJed Brown 5188acf2f550SJed Brown PetscFunctionBegin; 5189acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5190acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 51912205254eSKarl Rupp 51929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5193acf2f550SJed Brown PetscFunctionReturn(0); 5194acf2f550SJed Brown } 5195acf2f550SJed Brown 5196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5197d71ae5a4SJacob Faibussowitsch { 51989c8f2541SHong Zhang PetscFunctionBegin; 51999566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52009c8f2541SHong Zhang PetscFunctionReturn(0); 52019c8f2541SHong Zhang } 52029c8f2541SHong Zhang 520381824310SBarry Smith /* 520453dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
520553dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 520653dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 520753dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 520853dd7562SDmitry Karpeev */ 5209d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5210d71ae5a4SJacob Faibussowitsch { 521153dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 521253dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 521353dd7562SDmitry Karpeev PetscBool seqaij; 521453dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 521553dd7562SDmitry Karpeev PetscScalar v; 521653dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 521753dd7562SDmitry Karpeev 521853dd7562SDmitry Karpeev PetscFunctionBegin; 521953dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 522053dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52219566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 522228b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 522353dd7562SDmitry Karpeev if (rowemb) { 52249566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 522508401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 522653dd7562SDmitry Karpeev } else { 522708401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 522853dd7562SDmitry Karpeev } 522953dd7562SDmitry Karpeev if (colemb) { 52309566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 523108401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 523253dd7562SDmitry Karpeev } else { 523308401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 523453dd7562SDmitry Karpeev } 523553dd7562SDmitry Karpeev 523653dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 523753dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5239ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52419566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 524253dd7562SDmitry Karpeev } 524348a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 524453dd7562SDmitry Karpeev count = 0; 524553dd7562SDmitry Karpeev rowindices = NULL; 
524653dd7562SDmitry Karpeev colindices = NULL; 524748a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 524848a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 524953dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 525053dd7562SDmitry Karpeev PetscInt row; 525153dd7562SDmitry Karpeev row = i; 525253dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 525353dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 525453dd7562SDmitry Karpeev PetscInt col; 525553dd7562SDmitry Karpeev col = Baij->j[count]; 525653dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 525753dd7562SDmitry Karpeev v = Baij->a[count]; 52589566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 525953dd7562SDmitry Karpeev ++count; 526053dd7562SDmitry Karpeev } 526153dd7562SDmitry Karpeev } 526253dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 526353dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 526453dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 526553dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 526653dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 526753dd7562SDmitry Karpeev PetscFunctionReturn(0); 526853dd7562SDmitry Karpeev } 526953dd7562SDmitry Karpeev 5270dec0b466SHong Zhang PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A) 5271dec0b466SHong Zhang { 5272dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5273dec0b466SHong Zhang MatScalar *aa = a->a; 5274dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5275dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5276dec0b466SHong Zhang 5277dec0b466SHong Zhang PetscFunctionBegin; 5278dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5279dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5280dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5281dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5282dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 5283dec0b466SHong Zhang if (aa[k] == 0 && aj[k] != i - 1) fshift++; 5284dec0b466SHong Zhang else { 5285dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5286dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5287dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5288dec0b466SHong Zhang } 5289dec0b466SHong Zhang } 5290dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5291dec0b466SHong Zhang fshift_prev = fshift; 5292dec0b466SHong Zhang /* reset ilen and imax for each row */ 5293dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5294dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 5295dec0b466SHong 
Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5296dec0b466SHong Zhang } 5297dec0b466SHong Zhang if (m) { 5298dec0b466SHong Zhang ai[m] -= fshift; 5299dec0b466SHong Zhang a->nz = ai[m]; 5300dec0b466SHong Zhang } 5301dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5302dec0b466SHong Zhang A->nonzerostate -= fshift; 5303dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5304dec0b466SHong Zhang a->rmax = rmax; 5305dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5306dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5307dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5308dec0b466SHong Zhang PetscFunctionReturn(0); 5309dec0b466SHong Zhang } 5310dec0b466SHong Zhang 53114099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53124099cc6bSBarry Smith 53134099cc6bSBarry Smith /*@C 531411a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53154099cc6bSBarry Smith 531611a5261eSBarry Smith Collective on mat 53174099cc6bSBarry Smith 53184099cc6bSBarry Smith Input Parameters: 53194099cc6bSBarry Smith + mat - the matrix object 53204099cc6bSBarry Smith - matype - matrix type 53214099cc6bSBarry Smith 53224099cc6bSBarry Smith Options Database Key: 53234099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 53244099cc6bSBarry Smith 53254099cc6bSBarry Smith Level: intermediate 53264099cc6bSBarry Smith 5327db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53284099cc6bSBarry Smith @*/ 5329d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5330d71ae5a4SJacob Faibussowitsch { 53314099cc6bSBarry Smith PetscBool sametype; 53325f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53334099cc6bSBarry Smith 53344099cc6bSBarry Smith PetscFunctionBegin; 53354099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53369566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53374099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53384099cc6bSBarry Smith 53399566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53405f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53419566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53424099cc6bSBarry Smith PetscFunctionReturn(0); 53434099cc6bSBarry Smith } 53444099cc6bSBarry Smith 53454099cc6bSBarry Smith /*@C 534611a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53474099cc6bSBarry Smith 53484099cc6bSBarry Smith Not Collective 53494099cc6bSBarry Smith 53504099cc6bSBarry Smith Input Parameters: 535111a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 53524099cc6bSBarry Smith - function - routine to convert to subtype 53534099cc6bSBarry Smith 53544099cc6bSBarry Smith Notes: 535511a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
53564099cc6bSBarry Smith 53574099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53584099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53594099cc6bSBarry Smith 53604099cc6bSBarry Smith Level: advanced 53614099cc6bSBarry Smith 5362db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53634099cc6bSBarry Smith @*/ 5364d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5365d71ae5a4SJacob Faibussowitsch { 53664099cc6bSBarry Smith PetscFunctionBegin; 53679566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53689566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 53694099cc6bSBarry Smith PetscFunctionReturn(0); 53704099cc6bSBarry Smith } 53714099cc6bSBarry Smith 53724099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53734099cc6bSBarry Smith 53744099cc6bSBarry Smith /*@C 537511a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 53764099cc6bSBarry Smith 53774099cc6bSBarry Smith Not Collective 53784099cc6bSBarry Smith 53794099cc6bSBarry Smith Level: advanced 53804099cc6bSBarry Smith 5381db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53824099cc6bSBarry Smith @*/ 5383d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5384d71ae5a4SJacob Faibussowitsch { 53854099cc6bSBarry Smith PetscFunctionBegin; 53864099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53874099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53884099cc6bSBarry Smith 53899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 53929779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 53939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5394485f9817SRichard Tran Mills #endif 53955063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 53969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 53975063d097SStefano Zampini #endif 53985063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 53999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54005063d097SStefano Zampini #endif 54014099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54034099cc6bSBarry Smith #endif 54044099cc6bSBarry Smith PetscFunctionReturn(0); 54054099cc6bSBarry Smith } 540653dd7562SDmitry Karpeev 540753dd7562SDmitry Karpeev /* 540881824310SBarry Smith Special version for direct calls from Fortran 540981824310SBarry Smith */ 5410af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 541181824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 541281824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 541381824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 541481824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 541581824310SBarry Smith #endif 541681824310SBarry Smith 541781824310SBarry Smith /* Change these macros so can be used in void function */ 541898921bdaSJacob Faibussowitsch 541998921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54209566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54219566063dSJacob Faibussowitsch #undef PetscCall 54229371c9d4SSatish Balay #define PetscCall(...) 
\ 54239371c9d4SSatish Balay do { \ 54245f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 542598921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 542698921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 542798921bdaSJacob Faibussowitsch return; \ 542898921bdaSJacob Faibussowitsch } \ 542998921bdaSJacob Faibussowitsch } while (0) 543098921bdaSJacob Faibussowitsch 543198921bdaSJacob Faibussowitsch #undef SETERRQ 54329371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54339371c9d4SSatish Balay do { \ 543498921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 543598921bdaSJacob Faibussowitsch return; \ 543698921bdaSJacob Faibussowitsch } while (0) 543781824310SBarry Smith 5438d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5439d71ae5a4SJacob Faibussowitsch { 544081824310SBarry Smith Mat A = *AA; 544181824310SBarry Smith PetscInt m = *mm, n = *nn; 544281824310SBarry Smith InsertMode is = *isis; 544381824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 544481824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 544581824310SBarry Smith PetscInt *imax, *ai, *ailen; 544681824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 544754f21887SBarry Smith MatScalar *ap, value, *aa; 5448ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5449ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 545081824310SBarry Smith 545181824310SBarry Smith PetscFunctionBegin; 54524994cf47SJed Brown MatCheckPreallocated(A, 1); 545381824310SBarry Smith imax = a->imax; 545481824310SBarry Smith ai = a->i; 545581824310SBarry Smith 
ailen = a->ilen; 545681824310SBarry Smith aj = a->j; 545781824310SBarry Smith aa = a->a; 545881824310SBarry Smith 545981824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 546081824310SBarry Smith row = im[k]; 546181824310SBarry Smith if (row < 0) continue; 54625f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 54639371c9d4SSatish Balay rp = aj + ai[row]; 54649371c9d4SSatish Balay ap = aa + ai[row]; 54659371c9d4SSatish Balay rmax = imax[row]; 54669371c9d4SSatish Balay nrow = ailen[row]; 546781824310SBarry Smith low = 0; 546881824310SBarry Smith high = nrow; 546981824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 547081824310SBarry Smith if (in[l] < 0) continue; 54715f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 547281824310SBarry Smith col = in[l]; 54732205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 54742205254eSKarl Rupp else value = v[k + l * m]; 54752205254eSKarl Rupp 547681824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 547781824310SBarry Smith 54782205254eSKarl Rupp if (col <= lastcol) low = 0; 54792205254eSKarl Rupp else high = nrow; 548081824310SBarry Smith lastcol = col; 548181824310SBarry Smith while (high - low > 5) { 548281824310SBarry Smith t = (low + high) / 2; 548381824310SBarry Smith if (rp[t] > col) high = t; 548481824310SBarry Smith else low = t; 548581824310SBarry Smith } 548681824310SBarry Smith for (i = low; i < high; i++) { 548781824310SBarry Smith if (rp[i] > col) break; 548881824310SBarry Smith if (rp[i] == col) { 548981824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 549081824310SBarry Smith else ap[i] = value; 549181824310SBarry Smith goto noinsert; 549281824310SBarry Smith } 549381824310SBarry Smith } 549481824310SBarry Smith if (value == 0.0 && 
ignorezeroentries) goto noinsert; 549581824310SBarry Smith if (nonew == 1) goto noinsert; 54965f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5497fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 54989371c9d4SSatish Balay N = nrow++ - 1; 54999371c9d4SSatish Balay a->nz++; 55009371c9d4SSatish Balay high++; 550181824310SBarry Smith /* shift up all the later entries in this row */ 550281824310SBarry Smith for (ii = N; ii >= i; ii--) { 550381824310SBarry Smith rp[ii + 1] = rp[ii]; 550481824310SBarry Smith ap[ii + 1] = ap[ii]; 550581824310SBarry Smith } 550681824310SBarry Smith rp[i] = col; 550781824310SBarry Smith ap[i] = value; 5508e56f5c9eSBarry Smith A->nonzerostate++; 550981824310SBarry Smith noinsert:; 551081824310SBarry Smith low = i + 1; 551181824310SBarry Smith } 551281824310SBarry Smith ailen[row] = nrow; 551381824310SBarry Smith } 551481824310SBarry Smith PetscFunctionReturnVoid(); 551581824310SBarry Smith } 551698921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 551798921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 551898921bdaSJacob Faibussowitsch * original definitions */ 55199566063dSJacob Faibussowitsch #undef PetscCall 552098921bdaSJacob Faibussowitsch #undef SETERRQ 5521