1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5974e208921SJed Brown const MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 6004e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 6364e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, 
PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 11237b083b7cSBarry Smith 112417ab2063SBarry Smith /* reset ilen and imax for each row */ 11257b083b7cSBarry Smith a->nonzerorowcnt = 0; 1126396832f4SHong Zhang if (A->structure_only) { 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1129396832f4SHong Zhang } else { /* !A->structure_only */ 113017ab2063SBarry Smith for (i = 0; i < m; i++) { 113117ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11327b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113317ab2063SBarry Smith } 1134396832f4SHong Zhang } 1135bfeeae90SHong Zhang a->nz = ai[m]; 1136aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, 
PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113717ab2063SBarry Smith 11389566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11419566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11422205254eSKarl Rupp 11438e58a170SBarry Smith A->info.mallocs += a->reallocs; 1144dd5f02e7SSatish Balay a->reallocs = 0; 11456712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114636db0b34SBarry Smith a->rmax = rmax; 11474e220ebcSLois Curfman McInnes 114848a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11503a40ed3dSBarry Smith PetscFunctionReturn(0); 115117ab2063SBarry Smith } 115217ab2063SBarry Smith 1153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1154d71ae5a4SJacob Faibussowitsch { 115599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115699cafbc1SBarry Smith PetscInt i, nz = a->nz; 11572e5835c6SStefano Zampini MatScalar *aa; 115899cafbc1SBarry Smith 115999cafbc1SBarry Smith PetscFunctionBegin; 11609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116199cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116499cafbc1SBarry Smith PetscFunctionReturn(0); 
116599cafbc1SBarry Smith } 116699cafbc1SBarry Smith 1167d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1168d71ae5a4SJacob Faibussowitsch { 116999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117099cafbc1SBarry Smith PetscInt i, nz = a->nz; 11712e5835c6SStefano Zampini MatScalar *aa; 117299cafbc1SBarry Smith 117399cafbc1SBarry Smith PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117899cafbc1SBarry Smith PetscFunctionReturn(0); 117999cafbc1SBarry Smith } 118099cafbc1SBarry Smith 1181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1182d71ae5a4SJacob Faibussowitsch { 1183fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1184fff043a9SJunchao Zhang MatScalar *aa; 11853a40ed3dSBarry Smith 11863a40ed3dSBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11889566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913a40ed3dSBarry Smith PetscFunctionReturn(0); 119217ab2063SBarry Smith } 1193416022c9SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197cbc6b225SStefano Zampini 1198cbc6b225SStefano Zampini PetscFunctionBegin; 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1201cbc6b225SStefano Zampini PetscFunctionReturn(0); 
1202cbc6b225SStefano Zampini } 1203cbc6b225SStefano Zampini 1204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1205d71ae5a4SJacob Faibussowitsch { 1206416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1207d5d45c9bSBarry Smith 12083a40ed3dSBarry Smith PetscFunctionBegin; 1209aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1210c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121117ab2063SBarry Smith #endif 12129566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12139566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12159566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12269566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1228901853e0SKris Buschelman 12296718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12306718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12316718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12326718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12336718818eSStefano Zampini due to different matrix sizes */ 12349566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12356718818eSStefano Zampini 12369566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12382e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12472e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12482e956fe4SStefano Zampini #endif 12494222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12534222ddf1SHong Zhang #endif 12543d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12563d0639e7SStefano Zampini #endif 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1258af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1260af8000cdSHong Zhang #endif 1261d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1263d24d4204SJose E. 
Roman #endif 126463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 126763c07aadSStefano Zampini #endif 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12722e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12832e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12842e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12892e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12903a40ed3dSBarry Smith PetscFunctionReturn(0); 129117ab2063SBarry Smith } 129217ab2063SBarry Smith 1293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1294d71ae5a4SJacob Faibussowitsch { 1295416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 12963a40ed3dSBarry Smith 12973a40ed3dSBarry Smith PetscFunctionBegin; 1298a65d3064SKris Buschelman switch (op) { 1299d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1300d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1301d71ae5a4SJacob Faibussowitsch break; 1302d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1303d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1304d71ae5a4SJacob Faibussowitsch break; 1305d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1306d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1307d71ae5a4SJacob Faibussowitsch break; 1308d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1309d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1310d71ae5a4SJacob Faibussowitsch break; 1311d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1312d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1315d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1318d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1319d71ae5a4SJacob Faibussowitsch break; 13203d472b54SHong Zhang case MAT_SPD: 1321b1646e73SJed Brown case MAT_SYMMETRIC: 1322b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1323b1646e73SJed Brown case MAT_HERMITIAN: 1324b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1325957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1326b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1327b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1328b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13295021d80fSJed Brown break; 13308c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1331a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1332d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1333d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1334d71ae5a4SJacob Faibussowitsch break; 1335d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1336d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1337d71ae5a4SJacob Faibussowitsch break; 1338d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1339d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1340d71ae5a4SJacob Faibussowitsch break; 1341071fcb05SBarry Smith case MAT_SORTED_FULL: 
1342071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1343071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1344071fcb05SBarry Smith break; 1345d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1346d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1347d71ae5a4SJacob Faibussowitsch break; 1348d71ae5a4SJacob Faibussowitsch default: 1349d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1350a65d3064SKris Buschelman } 13513a40ed3dSBarry Smith PetscFunctionReturn(0); 135217ab2063SBarry Smith } 135317ab2063SBarry Smith 1354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1355d71ae5a4SJacob Faibussowitsch { 1356416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1357fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1358c898d852SStefano Zampini PetscScalar *x; 1359c898d852SStefano Zampini const PetscScalar *aa; 136017ab2063SBarry Smith 13613a40ed3dSBarry Smith PetscFunctionBegin; 13629566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1365d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1366d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13679566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13682c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137135e7444dSHong Zhang PetscFunctionReturn(0); 137235e7444dSHong Zhang } 137335e7444dSHong Zhang 13749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137535e7444dSHong Zhang for (i = 0; i < n; i++) { 
1376fdc842d1SBarry Smith x[i] = 0.0; 137735e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 137835e7444dSHong Zhang if (aj[j] == i) { 137935e7444dSHong Zhang x[i] = aa[j]; 138017ab2063SBarry Smith break; 138117ab2063SBarry Smith } 138217ab2063SBarry Smith } 138317ab2063SBarry Smith } 13849566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13863a40ed3dSBarry Smith PetscFunctionReturn(0); 138717ab2063SBarry Smith } 138817ab2063SBarry Smith 1389c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1390d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1391d71ae5a4SJacob Faibussowitsch { 1392416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13935f22a7b3SSebastian Grimberg const MatScalar *aa; 1394d9ca1df4SBarry Smith PetscScalar *y; 1395d9ca1df4SBarry Smith const PetscScalar *x; 1396d0f46423SBarry Smith PetscInt m = A->rmap->n; 13975c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 13985f22a7b3SSebastian Grimberg const MatScalar *v; 1399a77337e4SBarry Smith PetscScalar alpha; 1400d9ca1df4SBarry Smith PetscInt n, i, j; 1401d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14023447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1403ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14045c897100SBarry Smith #endif 140517ab2063SBarry Smith 14063a40ed3dSBarry Smith PetscFunctionBegin; 14079566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14099566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14115c897100SBarry Smith 14125c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1413fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14145c897100SBarry Smith #else 14153447b6efSHong Zhang if (usecprow) { 14163447b6efSHong Zhang m = cprow.nrows; 14173447b6efSHong Zhang ii = cprow.i; 14187b2bb3b9SHong Zhang ridx = cprow.rindex; 14193447b6efSHong Zhang } else { 14203447b6efSHong Zhang ii = a->i; 14213447b6efSHong Zhang } 142217ab2063SBarry Smith for (i = 0; i < m; i++) { 14233447b6efSHong Zhang idx = a->j + ii[i]; 1424fff043a9SJunchao Zhang v = aa + ii[i]; 14253447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14263447b6efSHong Zhang if (usecprow) { 14277b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14283447b6efSHong Zhang } else { 142917ab2063SBarry Smith alpha = x[i]; 14303447b6efSHong Zhang } 143104fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143217ab2063SBarry Smith } 14335c897100SBarry Smith #endif 14349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14359566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14369566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14383a40ed3dSBarry Smith PetscFunctionReturn(0); 143917ab2063SBarry Smith } 144017ab2063SBarry Smith 1441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1442d71ae5a4SJacob Faibussowitsch { 14435c897100SBarry Smith PetscFunctionBegin; 14449566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14459566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14465c897100SBarry Smith PetscFunctionReturn(0); 14475c897100SBarry Smith } 14485c897100SBarry Smith 1449c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145078b84d54SShri Abhyankar 1451d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1452d71ae5a4SJacob Faibussowitsch { 1453416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1454d9fead3dSBarry Smith PetscScalar *y; 145554f21887SBarry Smith const 
PetscScalar *x; 1456fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1457003131ecSBarry Smith PetscInt m = A->rmap->n; 14580298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14597b083b7cSBarry Smith PetscInt n, i; 1460362ced78SSatish Balay PetscScalar sum; 1461ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146217ab2063SBarry Smith 1463b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146497952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1465fee21e36SBarry Smith #endif 1466fee21e36SBarry Smith 14673a40ed3dSBarry Smith PetscFunctionBegin; 1468b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14699566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1470b215bc84SStefano Zampini PetscFunctionReturn(0); 1471b215bc84SStefano Zampini } 14729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14739566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14749566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1475416022c9SBarry Smith ii = a->i; 14764eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 147897952fefSHong Zhang m = a->compressedrow.nrows; 147997952fefSHong Zhang ii = a->compressedrow.i; 148097952fefSHong Zhang ridx = a->compressedrow.rindex; 148197952fefSHong Zhang for (i = 0; i < m; i++) { 148297952fefSHong Zhang n = ii[i + 1] - ii[i]; 148397952fefSHong Zhang aj = a->j + ii[i]; 1484fff043a9SJunchao Zhang aa = a_a + ii[i]; 148597952fefSHong Zhang sum = 0.0; 1486003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1487003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 148897952fefSHong Zhang y[*ridx++] = sum; 148997952fefSHong Zhang } 149097952fefSHong Zhang } else { /* do not use compressed row format */ 1491b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14923d3eaba7SBarry Smith aj = a->j; 1493fff043a9SJunchao Zhang aa 
= a_a; 1494b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1495b05257ddSBarry Smith #else 149617ab2063SBarry Smith for (i = 0; i < m; i++) { 1497003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1498003131ecSBarry Smith aj = a->j + ii[i]; 1499fff043a9SJunchao Zhang aa = a_a + ii[i]; 150017ab2063SBarry Smith sum = 0.0; 1501003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150217ab2063SBarry Smith y[i] = sum; 150317ab2063SBarry Smith } 15048d195f9aSBarry Smith #endif 1505b05257ddSBarry Smith } 15069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15089566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15103a40ed3dSBarry Smith PetscFunctionReturn(0); 151117ab2063SBarry Smith } 151217ab2063SBarry Smith 1513d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1514d71ae5a4SJacob Faibussowitsch { 1515b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1516b434eb95SMatthew G. Knepley PetscScalar *y; 1517b434eb95SMatthew G. Knepley const PetscScalar *x; 1518fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1519b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1520b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1521b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1522b434eb95SMatthew G. Knepley PetscScalar sum; 1523b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1524b434eb95SMatthew G. Knepley 1525b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1526b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1527b434eb95SMatthew G. Knepley #endif 1528b434eb95SMatthew G. Knepley 1529b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15319566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15329566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1533b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1534b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1535b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1536b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1537b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1538b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1539b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1540fff043a9SJunchao Zhang aa = a_a + ii[i]; 1541b434eb95SMatthew G. Knepley sum = 0.0; 1542b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1543b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1544b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1545b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1546b434eb95SMatthew G. Knepley } 1547b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15483d3eaba7SBarry Smith ii = a->i; 1549b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1550b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1551b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1552fff043a9SJunchao Zhang aa = a_a + ii[i]; 1553b434eb95SMatthew G. Knepley sum = 0.0; 1554b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1555b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1556b434eb95SMatthew G. Knepley y[i] = sum; 1557b434eb95SMatthew G. Knepley } 1558b434eb95SMatthew G. Knepley } 15599566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15619566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1563b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1564b434eb95SMatthew G. Knepley } 1565b434eb95SMatthew G. Knepley 1566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1567d71ae5a4SJacob Faibussowitsch { 1568b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1569b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1570b434eb95SMatthew G. Knepley const PetscScalar *x; 1571fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1572b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1573b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1574b434eb95SMatthew G. Knepley PetscScalar sum; 1575b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1576b434eb95SMatthew G. Knepley 1577b434eb95SMatthew G. Knepley PetscFunctionBegin; 15789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15809566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1581b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1583b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1584b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1585b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1586b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1587b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1588b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1589fff043a9SJunchao Zhang aa = a_a + ii[i]; 1590b434eb95SMatthew G. Knepley sum = y[*ridx]; 1591b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1592b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1593b434eb95SMatthew G. Knepley } 1594b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15953d3eaba7SBarry Smith ii = a->i; 1596b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1597b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1598b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1599fff043a9SJunchao Zhang aa = a_a + ii[i]; 1600b434eb95SMatthew G. Knepley sum = y[i]; 1601b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1602b434eb95SMatthew G. Knepley z[i] = sum; 1603b434eb95SMatthew G. Knepley } 1604b434eb95SMatthew G. Knepley } 16059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1609b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1610b434eb95SMatthew G. Knepley } 1611b434eb95SMatthew G. Knepley 1612c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1613d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1614d71ae5a4SJacob Faibussowitsch { 1615416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1616f15663dcSBarry Smith PetscScalar *y, *z; 1617f15663dcSBarry Smith const PetscScalar *x; 1618fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1619d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1620d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1621362ced78SSatish Balay PetscScalar sum; 1622ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16239ea0dfa2SSatish Balay 16243a40ed3dSBarry Smith PetscFunctionBegin; 1625b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16269566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1627b215bc84SStefano Zampini PetscFunctionReturn(0); 1628b215bc84SStefano Zampini } 16299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16319566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16324eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163348a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163497952fefSHong Zhang m = a->compressedrow.nrows; 163597952fefSHong Zhang ii = a->compressedrow.i; 163697952fefSHong Zhang ridx = a->compressedrow.rindex; 163797952fefSHong Zhang for (i = 0; i < m; i++) { 163897952fefSHong Zhang n = ii[i + 1] - ii[i]; 163997952fefSHong Zhang aj = a->j + ii[i]; 1640fff043a9SJunchao Zhang aa = a_a + ii[i]; 164197952fefSHong Zhang sum = y[*ridx]; 1642f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164397952fefSHong Zhang z[*ridx++] = sum; 164497952fefSHong Zhang } 164597952fefSHong Zhang } else { /* do not use compressed row format */ 16463d3eaba7SBarry Smith ii = a->i; 1647f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16483d3eaba7SBarry Smith aj = a->j; 1649fff043a9SJunchao Zhang aa = a_a; 1650f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1651f15663dcSBarry Smith #else 165217ab2063SBarry Smith for (i = 0; i < m; i++) { 1653f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1654f15663dcSBarry Smith aj = a->j + ii[i]; 1655fff043a9SJunchao Zhang aa = a_a + ii[i]; 165617ab2063SBarry Smith sum = y[i]; 1657f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165817ab2063SBarry Smith z[i] = sum; 165917ab2063SBarry Smith } 166002ab625aSSatish Balay #endif 1661f15663dcSBarry Smith } 16629566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16663a40ed3dSBarry Smith PetscFunctionReturn(0); 166717ab2063SBarry Smith } 166817ab2063SBarry Smith 166917ab2063SBarry Smith /* 167017ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167117ab2063SBarry Smith */ 1672d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1673d71ae5a4SJacob Faibussowitsch { 1674416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1675d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1676c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 167717ab2063SBarry Smith 16783a40ed3dSBarry Smith PetscFunctionBegin; 167909f38230SBarry Smith if (!a->diag) { 16809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1681c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168209f38230SBarry Smith } 1683d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1684c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1685c0c07093SJunchao Zhang if (alreadySet) { 1686c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1687c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1688c0c07093SJunchao Zhang } 1689c0c07093SJunchao Zhang 169009f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1691bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1692bfeeae90SHong Zhang if (a->j[j] == i) { 169309f38230SBarry Smith a->diag[i] = j; 169417ab2063SBarry Smith break; 169517ab2063SBarry Smith } 169617ab2063SBarry Smith } 169717ab2063SBarry Smith } 16983a40ed3dSBarry Smith PetscFunctionReturn(0); 169917ab2063SBarry Smith } 170017ab2063SBarry Smith 1701d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1702d71ae5a4SJacob Faibussowitsch { 170361ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170461ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170561ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 170661ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 170761ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 170861ecd0c6SBarry Smith 170961ecd0c6SBarry Smith PetscFunctionBegin; 
171061ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17129566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171361ecd0c6SBarry Smith PetscFunctionReturn(0); 171461ecd0c6SBarry Smith } 171561ecd0c6SBarry Smith 171661ecd0c6SBarry Smith if (a->diagonaldense) { 171761ecd0c6SBarry Smith cnt = 0; 171861ecd0c6SBarry Smith } else { 17199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1721349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172261ecd0c6SBarry Smith cnt++; 172361ecd0c6SBarry Smith mdiag[i] = 1; 172461ecd0c6SBarry Smith } 172561ecd0c6SBarry Smith } 172661ecd0c6SBarry Smith } 172761ecd0c6SBarry Smith if (!cnt) { 17289566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 172961ecd0c6SBarry Smith } else { 1730b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1731b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173261ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173361ecd0c6SBarry Smith 173461ecd0c6SBarry Smith a->a = NULL; 173561ecd0c6SBarry Smith a->j = NULL; 173661ecd0c6SBarry Smith a->i = NULL; 173761ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1738ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 174061ecd0c6SBarry Smith 174161ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174261ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17439566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174448a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1745447d62f5SStefano Zampini } 17469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 174861ecd0c6SBarry Smith if (singlemalloc) { 17499566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 175061ecd0c6SBarry Smith } else { 17519566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17529566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17539566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175461ecd0c6SBarry Smith } 175561ecd0c6SBarry Smith } 17569566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 175761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 175861ecd0c6SBarry Smith PetscFunctionReturn(0); 175961ecd0c6SBarry Smith } 176061ecd0c6SBarry Smith 1761be5855fcSBarry Smith /* 1762be5855fcSBarry Smith Checks for missing diagonals 1763be5855fcSBarry Smith */ 1764d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1765d71ae5a4SJacob Faibussowitsch { 1766be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17677734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1768be5855fcSBarry Smith 1769be5855fcSBarry Smith PetscFunctionBegin; 177009f38230SBarry Smith *missing = PETSC_FALSE; 17717734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177209f38230SBarry Smith *missing = PETSC_TRUE; 177309f38230SBarry Smith if (d) *d = 0; 17749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177509f38230SBarry Smith } else { 177601445905SHong Zhang PetscInt n; 177701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1778f1e2ffcdSBarry Smith diag = a->diag; 177901445905SHong Zhang for (i = 0; i < n; i++) { 17807734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178109f38230SBarry Smith *missing = PETSC_TRUE; 178209f38230SBarry Smith if (d) *d = i; 17839566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1784358d2f5dSShri Abhyankar break; 178509f38230SBarry Smith } 1786be5855fcSBarry Smith } 1787be5855fcSBarry Smith } 1788be5855fcSBarry Smith PetscFunctionReturn(0); 1789be5855fcSBarry Smith } 1790be5855fcSBarry Smith 17910da83c2eSBarry Smith #include <petscblaslapack.h> 17920da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17930da83c2eSBarry Smith 17940da83c2eSBarry Smith /* 17950da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17960da83c2eSBarry Smith */ 1797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1798d71ae5a4SJacob Faibussowitsch { 17990da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18000da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18010da83c2eSBarry Smith const PetscReal shift = 0.0; 18020da83c2eSBarry Smith PetscInt ipvt[5]; 18034e208921SJed Brown PetscCount flops = 0; 18040da83c2eSBarry Smith PetscScalar work[25], *v_work; 18050da83c2eSBarry Smith 18060da83c2eSBarry Smith PetscFunctionBegin; 18070da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18080da83c2eSBarry 
Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 180908401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1810ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181248a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18130da83c2eSBarry Smith ncnt = 0; 18140da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18150da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18169566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18170da83c2eSBarry Smith switch (bsizes[i]) { 1818d71ae5a4SJacob Faibussowitsch case 1: 1819d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1820d71ae5a4SJacob Faibussowitsch break; 18210da83c2eSBarry Smith case 2: 18229566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18230da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18249566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18250da83c2eSBarry Smith break; 18260da83c2eSBarry Smith case 3: 18279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18280da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18300da83c2eSBarry Smith break; 18310da83c2eSBarry Smith case 4: 18329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18330da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 
18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18350da83c2eSBarry Smith break; 18360da83c2eSBarry Smith case 5: 18379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18380da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18400da83c2eSBarry Smith break; 18410da83c2eSBarry Smith case 6: 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18430da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18450da83c2eSBarry Smith break; 18460da83c2eSBarry Smith case 7: 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18480da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18500da83c2eSBarry Smith break; 18510da83c2eSBarry Smith default: 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18530da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18550da83c2eSBarry Smith } 18560da83c2eSBarry Smith ncnt += bsizes[i]; 18570da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18584e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18590da83c2eSBarry Smith } 18604e208921SJed Brown PetscLogFlops(flops); 186148a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 
18629566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18630da83c2eSBarry Smith PetscFunctionReturn(0); 18640da83c2eSBarry Smith } 18650da83c2eSBarry Smith 1866422a814eSBarry Smith /* 1867422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1868422a814eSBarry Smith */ 1869d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1870d71ae5a4SJacob Faibussowitsch { 187171f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1872d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18732e5835c6SStefano Zampini const MatScalar *v; 187454f21887SBarry Smith PetscScalar *idiag, *mdiag; 187571f1c65dSBarry Smith 187671f1c65dSBarry Smith PetscFunctionBegin; 187771f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18789566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 187971f1c65dSBarry Smith diag = a->diag; 18804dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18812e5835c6SStefano Zampini 188271f1c65dSBarry Smith mdiag = a->mdiag; 188371f1c65dSBarry Smith idiag = a->idiag; 18849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1885422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 188671f1c65dSBarry Smith for (i = 0; i < m; i++) { 188771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1888899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1889899639b0SHong Zhang if (PetscRealPart(fshift)) { 18909566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18917b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18927b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18937b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189498921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero 
diagonal on row %" PetscInt_FMT, i); 1895899639b0SHong Zhang } 189671f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 189771f1c65dSBarry Smith } 18989566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 189971f1c65dSBarry Smith } else { 190071f1c65dSBarry Smith for (i = 0; i < m; i++) { 190171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 190271f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 190371f1c65dSBarry Smith } 19049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190571f1c65dSBarry Smith } 190671f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 190871f1c65dSBarry Smith PetscFunctionReturn(0); 190971f1c65dSBarry Smith } 191071f1c65dSBarry Smith 1911c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1912d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1913d71ae5a4SJacob Faibussowitsch { 1914416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1915e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19162e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 191754f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19183d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 191997f1f81fSBarry Smith const PetscInt *idx, *diag; 192017ab2063SBarry Smith 19213a40ed3dSBarry Smith PetscFunctionBegin; 1922b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19239566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1924b215bc84SStefano Zampini PetscFunctionReturn(0); 1925b215bc84SStefano Zampini } 1926b965ef7fSBarry Smith its = its * lits; 192791723122SBarry Smith 192871f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19299566063dSJacob 
Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 193071f1c65dSBarry Smith a->fshift = fshift; 193171f1c65dSBarry Smith a->omega = omega; 1932ed480e8bSBarry Smith 193371f1c65dSBarry Smith diag = a->diag; 193471f1c65dSBarry Smith t = a->ssor_work; 1935ed480e8bSBarry Smith idiag = a->idiag; 193671f1c65dSBarry Smith mdiag = a->mdiag; 1937ed480e8bSBarry Smith 19389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19399566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19409566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1941ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 194217ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 194317ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1944ed480e8bSBarry Smith bs = b; 194517ab2063SBarry Smith for (i = 0; i < m; i++) { 194671f1c65dSBarry Smith d = fshift + mdiag[i]; 1947416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1948ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19492e5835c6SStefano Zampini v = aa + diag[i] + 1; 195017ab2063SBarry Smith sum = b[i] * d / omega; 1951003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 195217ab2063SBarry Smith x[i] = sum; 195317ab2063SBarry Smith } 19549566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19559566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19579566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19583a40ed3dSBarry Smith PetscFunctionReturn(0); 195917ab2063SBarry Smith } 1960c783ea89SBarry Smith 196108401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1962f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19634c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower 
triangular, 1964887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196517ab2063SBarry Smith 196617ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 196717ab2063SBarry Smith 1968887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 196917ab2063SBarry Smith */ 197017ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 197117ab2063SBarry Smith 197217ab2063SBarry Smith /* x = (E + U)^{-1} b */ 197317ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1974416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1975ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19762e5835c6SStefano Zampini v = aa + diag[i] + 1; 197717ab2063SBarry Smith sum = b[i]; 1978e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1979ed480e8bSBarry Smith x[i] = sum * idiag[i]; 198017ab2063SBarry Smith } 198117ab2063SBarry Smith 198217ab2063SBarry Smith /* t = b - (2*E - D)x */ 19832e5835c6SStefano Zampini v = aa; 19842205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198517ab2063SBarry Smith 198617ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1987ed480e8bSBarry Smith ts = t; 1988416022c9SBarry Smith diag = a->diag; 198917ab2063SBarry Smith for (i = 0; i < m; i++) { 1990416022c9SBarry Smith n = diag[i] - a->i[i]; 1991ed480e8bSBarry Smith idx = a->j + a->i[i]; 19922e5835c6SStefano Zampini v = aa + a->i[i]; 199317ab2063SBarry Smith sum = t[i]; 1994003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1995ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1996733d66baSBarry Smith /* x = x + t */ 1997733d66baSBarry Smith x[i] += t[i]; 199817ab2063SBarry Smith } 199917ab2063SBarry Smith 20009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20019566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20029566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20033a40ed3dSBarry Smith PetscFunctionReturn(0); 200417ab2063SBarry Smith } 200517ab2063SBarry Smith if (flag & 
SOR_ZERO_INITIAL_GUESS) { 200617ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 200717ab2063SBarry Smith for (i = 0; i < m; i++) { 2008416022c9SBarry Smith n = diag[i] - a->i[i]; 2009ed480e8bSBarry Smith idx = a->j + a->i[i]; 20102e5835c6SStefano Zampini v = aa + a->i[i]; 201117ab2063SBarry Smith sum = b[i]; 2012e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20135c99c7daSBarry Smith t[i] = sum; 2014ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201517ab2063SBarry Smith } 20165c99c7daSBarry Smith xb = t; 20179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20183a40ed3dSBarry Smith } else xb = b; 201917ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 202017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2021416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2022ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20232e5835c6SStefano Zampini v = aa + diag[i] + 1; 202417ab2063SBarry Smith sum = xb[i]; 2025e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20265c99c7daSBarry Smith if (xb == b) { 2027ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20285c99c7daSBarry Smith } else { 2029b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 203017ab2063SBarry Smith } 20315c99c7daSBarry Smith } 20329566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 203317ab2063SBarry Smith } 203417ab2063SBarry Smith its--; 203517ab2063SBarry Smith } 203617ab2063SBarry Smith while (its--) { 203717ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203817ab2063SBarry Smith for (i = 0; i < m; i++) { 2039b19a5dc2SMark Adams /* lower */ 2040b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2041ed480e8bSBarry Smith idx = a->j + a->i[i]; 20422e5835c6SStefano Zampini v = aa + a->i[i]; 204317ab2063SBarry Smith sum = b[i]; 2044e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 
2045b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2046b19a5dc2SMark Adams /* upper */ 2047b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2048b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20492e5835c6SStefano Zampini v = aa + diag[i] + 1; 2050b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2051b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 205217ab2063SBarry Smith } 2053b19a5dc2SMark Adams xb = t; 20549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2055b19a5dc2SMark Adams } else xb = b; 205617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2058b19a5dc2SMark Adams sum = xb[i]; 2059b19a5dc2SMark Adams if (xb == b) { 2060b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2061416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2062ed480e8bSBarry Smith idx = a->j + a->i[i]; 20632e5835c6SStefano Zampini v = aa + a->i[i]; 2064e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2065ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2066b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2067b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2068b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20692e5835c6SStefano Zampini v = aa + diag[i] + 1; 2070b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2071b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207217ab2063SBarry Smith } 2073b19a5dc2SMark Adams } 2074b19a5dc2SMark Adams if (xb == b) { 20759566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2076b19a5dc2SMark Adams } else { 20779566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2078b19a5dc2SMark Adams } 207917ab2063SBarry Smith } 208017ab2063SBarry Smith } 20819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20829566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2084365a8a9eSBarry Smith PetscFunctionReturn(0); 208517ab2063SBarry Smith } 208617ab2063SBarry Smith 2087d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2088d71ae5a4SJacob Faibussowitsch { 2089416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20904e220ebcSLois Curfman McInnes 20913a40ed3dSBarry Smith PetscFunctionBegin; 20924e220ebcSLois Curfman McInnes info->block_size = 1.0; 20933966268fSBarry Smith info->nz_allocated = a->maxnz; 20943966268fSBarry Smith info->nz_used = a->nz; 20953966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20963966268fSBarry Smith info->assemblies = A->num_ass; 20973966268fSBarry Smith info->mallocs = A->info.mallocs; 20984dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2099d5f3da31SBarry Smith if (A->factortype) { 21004e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21014e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21024e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21034e220ebcSLois Curfman McInnes } else { 21044e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21054e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21064e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21074e220ebcSLois Curfman 
McInnes } 21083a40ed3dSBarry Smith PetscFunctionReturn(0); 210917ab2063SBarry Smith } 211017ab2063SBarry Smith 2111d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2112d71ae5a4SJacob Faibussowitsch { 2113416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2114c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211597b48c8fSBarry Smith const PetscScalar *xx; 21162e5835c6SStefano Zampini PetscScalar *bb, *aa; 2117c7da8527SEric Chamberland PetscInt d = 0; 211817ab2063SBarry Smith 21193a40ed3dSBarry Smith PetscFunctionBegin; 212097b48c8fSBarry Smith if (x && b) { 21219566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21229566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 212397b48c8fSBarry Smith for (i = 0; i < N; i++) { 2124aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2125447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 212697b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 212797b48c8fSBarry Smith } 21289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21299566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 213097b48c8fSBarry Smith } 213197b48c8fSBarry Smith 21329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2133a9817697SBarry Smith if (a->keepnonzeropattern) { 2134f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2135aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21369566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2137f1e2ffcdSBarry Smith } 2138f4df32b1SMatthew Knepley if (diag != 0.0) { 2139c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2140c7da8527SEric Chamberland d = rows[i]; 2141447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 214208401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2143c7da8527SEric Chamberland } 2144f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2145447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21462e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2147f1e2ffcdSBarry Smith } 2148f1e2ffcdSBarry Smith } 2149f1e2ffcdSBarry Smith } else { 2150f4df32b1SMatthew Knepley if (diag != 0.0) { 215117ab2063SBarry Smith for (i = 0; i < N; i++) { 2152aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21537ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2154447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2155447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2156447d62f5SStefano Zampini } else { 2157416022c9SBarry Smith a->ilen[rows[i]] = 1; 21582e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2159bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2160447d62f5SStefano Zampini } 2161447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21629566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 216317ab2063SBarry Smith } 216417ab2063SBarry Smith } 21653a40ed3dSBarry Smith } else { 216617ab2063SBarry Smith for (i = 0; i < N; i++) { 2167aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2168416022c9SBarry Smith a->ilen[rows[i]] = 0; 216917ab2063SBarry Smith } 217017ab2063SBarry Smith } 2171e56f5c9eSBarry Smith A->nonzerostate++; 2172f1e2ffcdSBarry Smith } 21739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2174dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21753a40ed3dSBarry Smith PetscFunctionReturn(0); 217617ab2063SBarry Smith } 217717ab2063SBarry Smith 2178d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2179d71ae5a4SJacob Faibussowitsch { 21806e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21816e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21822b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21836e169961SBarry Smith const PetscScalar *xx; 21842e5835c6SStefano Zampini PetscScalar *bb, *aa; 21856e169961SBarry Smith 21866e169961SBarry Smith PetscFunctionBegin; 21872e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21896e169961SBarry Smith if (x && b) { 21909566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21919566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21922b40b63fSBarry Smith vecs = PETSC_TRUE; 21936e169961SBarry Smith } 21949566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21956e169961SBarry Smith for (i = 0; i < N; i++) { 2196aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21979566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 21982205254eSKarl Rupp 21996e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22006e169961SBarry Smith } 22016e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22026e169961SBarry Smith if (!zeroed[i]) { 22036e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22044cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22052e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22062e5835c6SStefano Zampini aa[j] = 0.0; 22076e169961SBarry Smith } 22086e169961SBarry Smith } 22094cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22106e169961SBarry Smith } 22116e169961SBarry Smith if (x && b) { 22129566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22139566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22146e169961SBarry Smith } 22159566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22166e169961SBarry Smith if (diag != 0.0) { 22179566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22181d5a398dSstefano_zampini if (missing) { 22191d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22204cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2221aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22229566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22231d5a398dSstefano_zampini } 22241d5a398dSstefano_zampini } else { 2225ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22266e169961SBarry Smith } 22271d5a398dSstefano_zampini } 22289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2229dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22306e169961SBarry Smith PetscFunctionReturn(0); 22316e169961SBarry Smith } 22326e169961SBarry Smith 2233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2234d71ae5a4SJacob Faibussowitsch { 2235fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2236fff043a9SJunchao Zhang const PetscScalar *aa; 2237fff043a9SJunchao Zhang PetscInt *itmp; 223817ab2063SBarry Smith 22393a40ed3dSBarry Smith PetscFunctionBegin; 22409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2241416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22422e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 224317ab2063SBarry Smith if (idx) { 2244bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224526fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2246f4259b30SLisandro Dalcin else *idx = NULL; 224717ab2063SBarry Smith } 22489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22493a40ed3dSBarry Smith PetscFunctionReturn(0); 225017ab2063SBarry Smith } 225117ab2063SBarry Smith 2252d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2253d71ae5a4SJacob Faibussowitsch { 22543a40ed3dSBarry Smith PetscFunctionBegin; 2255cb4a9cd9SHong Zhang if (nz) *nz = 0; 22562e5835c6SStefano Zampini if (idx) *idx = NULL; 22572e5835c6SStefano Zampini if (v) *v = NULL; 22583a40ed3dSBarry Smith PetscFunctionReturn(0); 225917ab2063SBarry Smith } 226017ab2063SBarry Smith 2261d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2262d71ae5a4SJacob Faibussowitsch { 2263416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22642e5835c6SStefano Zampini const MatScalar *v; 226536db0b34SBarry Smith PetscReal sum = 0.0; 226697f1f81fSBarry Smith PetscInt i, j; 226717ab2063SBarry Smith 22683a40ed3dSBarry Smith PetscFunctionBegin; 22699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227017ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2271570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2272570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2273792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2274570b7f6dSBarry Smith #else 2275416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22769371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22779371c9d4SSatish Balay v++; 227817ab2063SBarry Smith } 22798f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2280570b7f6dSBarry Smith #endif 22819566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22823a40ed3dSBarry Smith } else if (type == NORM_1) { 228336db0b34SBarry Smith PetscReal *tmp; 228497f1f81fSBarry Smith PetscInt *jj = a->j; 22859566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2286064f8208SBarry Smith *nrm = 0.0; 2287416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22889371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22899371c9d4SSatish Balay v++; 229017ab2063SBarry Smith } 2291d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2292064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229317ab2063SBarry Smith } 22949566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22959566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22963a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2297064f8208SBarry Smith *nrm = 0.0; 2298d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22992e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 230017ab2063SBarry Smith sum = 0.0; 2301416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23029371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23039371c9d4SSatish Balay v2++; 230417ab2063SBarry Smith } 2305064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230617ab2063SBarry Smith } 23079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2308f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23103a40ed3dSBarry Smith PetscFunctionReturn(0); 231117ab2063SBarry Smith } 231217ab2063SBarry Smith 2313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2314d71ae5a4SJacob Faibussowitsch { 23153d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231654f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23172e5835c6SStefano Zampini const MatScalar *va, *vb; 
231897f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2319cd0d46ebSvictorle 2320cd0d46ebSvictorle PetscFunctionBegin; 23219566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23229566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23235485867bSBarry Smith if (ma != nb || na != mb) { 23245485867bSBarry Smith *f = PETSC_FALSE; 23255485867bSBarry Smith PetscFunctionReturn(0); 23265485867bSBarry Smith } 23279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23299371c9d4SSatish Balay aii = aij->i; 23309371c9d4SSatish Balay bii = bij->i; 23319371c9d4SSatish Balay adx = aij->j; 23329371c9d4SSatish Balay bdx = bij->j; 23339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2335cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2336cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2337cd0d46ebSvictorle 2338cd0d46ebSvictorle *f = PETSC_TRUE; 2339cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2340cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234197f1f81fSBarry Smith PetscInt idc, idr; 23425485867bSBarry Smith PetscScalar vc, vr; 2343cd0d46ebSvictorle /* column/row index/value */ 23445485867bSBarry Smith idc = adx[aptr[i]]; 23455485867bSBarry Smith idr = bdx[bptr[idc]]; 23465485867bSBarry Smith vc = va[aptr[i]]; 23475485867bSBarry Smith vr = vb[bptr[idc]]; 23485485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23495485867bSBarry Smith *f = PETSC_FALSE; 23505485867bSBarry Smith goto done; 2351cd0d46ebSvictorle } else { 23525485867bSBarry Smith aptr[i]++; 23535485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2354cd0d46ebSvictorle } 2355cd0d46ebSvictorle } 2356cd0d46ebSvictorle } 2357cd0d46ebSvictorle done: 23589566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23599566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2362cd0d46ebSvictorle PetscFunctionReturn(0); 2363cd0d46ebSvictorle } 2364cd0d46ebSvictorle 2365d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2366d71ae5a4SJacob Faibussowitsch { 23673d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236854f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236954f21887SBarry Smith MatScalar *va, *vb; 23701cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23711cbb95d3SBarry Smith 23721cbb95d3SBarry Smith PetscFunctionBegin; 23739566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23749566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23751cbb95d3SBarry Smith if (ma != nb || na != mb) { 23761cbb95d3SBarry Smith *f = PETSC_FALSE; 23771cbb95d3SBarry Smith PetscFunctionReturn(0); 23781cbb95d3SBarry Smith } 23799371c9d4SSatish Balay aii = aij->i; 23809371c9d4SSatish Balay bii = bij->i; 23819371c9d4SSatish Balay adx = aij->j; 23829371c9d4SSatish Balay bdx = bij->j; 23839371c9d4SSatish Balay va = aij->a; 23849371c9d4SSatish Balay vb = bij->a; 23859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23871cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23881cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23891cbb95d3SBarry Smith 23901cbb95d3SBarry Smith *f = PETSC_TRUE; 23911cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23921cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23931cbb95d3SBarry Smith PetscInt idc, idr; 23941cbb95d3SBarry Smith PetscScalar vc, vr; 23951cbb95d3SBarry Smith /* column/row index/value */ 23961cbb95d3SBarry Smith idc = adx[aptr[i]]; 23971cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
23981cbb95d3SBarry Smith vc = va[aptr[i]]; 23991cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24001cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24011cbb95d3SBarry Smith *f = PETSC_FALSE; 24021cbb95d3SBarry Smith goto done; 24031cbb95d3SBarry Smith } else { 24041cbb95d3SBarry Smith aptr[i]++; 24051cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24061cbb95d3SBarry Smith } 24071cbb95d3SBarry Smith } 24081cbb95d3SBarry Smith } 24091cbb95d3SBarry Smith done: 24109566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24119566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24121cbb95d3SBarry Smith PetscFunctionReturn(0); 24131cbb95d3SBarry Smith } 24141cbb95d3SBarry Smith 2415d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2416d71ae5a4SJacob Faibussowitsch { 24179e29f15eSvictorle PetscFunctionBegin; 24189566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24199e29f15eSvictorle PetscFunctionReturn(0); 24209e29f15eSvictorle } 24219e29f15eSvictorle 2422d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2423d71ae5a4SJacob Faibussowitsch { 24241cbb95d3SBarry Smith PetscFunctionBegin; 24259566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24261cbb95d3SBarry Smith PetscFunctionReturn(0); 24271cbb95d3SBarry Smith } 24281cbb95d3SBarry Smith 2429d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2430d71ae5a4SJacob Faibussowitsch { 2431416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2432fff8e43fSBarry Smith const PetscScalar *l, *r; 2433fff8e43fSBarry Smith PetscScalar x; 243454f21887SBarry Smith MatScalar *v; 2435fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2436fff8e43fSBarry Smith const PetscInt *jj; 243717ab2063SBarry Smith 24383a40ed3dSBarry Smith PetscFunctionBegin; 
243917ab2063SBarry Smith if (ll) { 24403ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24413ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24429566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244308401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244617ab2063SBarry Smith for (i = 0; i < m; i++) { 244717ab2063SBarry Smith x = l[i]; 2448416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24492205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 245017ab2063SBarry Smith } 24519566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24529566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245417ab2063SBarry Smith } 245517ab2063SBarry Smith if (rr) { 24569566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245708401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24589566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24602e5835c6SStefano Zampini jj = a->j; 24612205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24649566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246517ab2063SBarry Smith } 24669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24673a40ed3dSBarry Smith PetscFunctionReturn(0); 246817ab2063SBarry Smith } 246917ab2063SBarry Smith 2470d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2471d71ae5a4SJacob Faibussowitsch { 2472db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2473d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247497f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24755d0c19d7SBarry Smith const PetscInt *irow, *icol; 24762e5835c6SStefano Zampini const PetscScalar *aa; 24775d0c19d7SBarry Smith PetscInt nrows, ncols; 247897f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2479*fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2480416022c9SBarry Smith Mat C; 2481cdc6f3adSToby Isaac PetscBool stride; 248217ab2063SBarry Smith 24833a40ed3dSBarry Smith PetscFunctionBegin; 24849566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24859566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24869566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248717ab2063SBarry Smith 24889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2489ff718158SBarry Smith if (stride) { 24909566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2491ff718158SBarry Smith } else { 2492ff718158SBarry Smith first = 0; 2493ff718158SBarry Smith step = 0; 2494ff718158SBarry Smith } 2495fee21e36SBarry Smith if (stride && step == 1) { 249602834360SBarry Smith /* special case of contiguous rows */ 24979566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249802834360SBarry Smith /* loop over new rows determining lens and starting points */ 249902834360SBarry Smith for (i = 0; i < nrows; i++) { 2500bfeeae90SHong Zhang kstart = ai[irow[i]]; 2501a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2502a91a9bebSLisandro Dalcin starts[i] = kstart; 250302834360SBarry Smith for (k = kstart; k < kend; k++) { 2504bfeeae90SHong Zhang if 
(aj[k] >= first) { 250502834360SBarry Smith starts[i] = k; 250602834360SBarry Smith break; 250702834360SBarry Smith } 250802834360SBarry Smith } 2509a2744918SBarry Smith sum = 0; 251002834360SBarry Smith while (k < kend) { 2511bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2512a2744918SBarry Smith sum++; 251302834360SBarry Smith } 2514a2744918SBarry Smith lens[i] = sum; 251502834360SBarry Smith } 251602834360SBarry Smith /* create submatrix */ 2517cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251897f1f81fSBarry Smith PetscInt n_cols, n_rows; 25199566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2520aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25219566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 252208480c60SBarry Smith C = *B; 25233a40ed3dSBarry Smith } else { 25243bef6203SJed Brown PetscInt rbs, cbs; 25259566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25279566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25289566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25299566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25309566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 253208480c60SBarry Smith } 2533db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2534db02288aSLois Curfman McInnes 253502834360SBarry Smith /* loop over rows inserting into submatrix */ 2536*fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2537db02288aSLois Curfman McInnes j_new = c->j; 2538db02288aSLois Curfman McInnes i_new = 
c->i; 25399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 254002834360SBarry Smith for (i = 0; i < nrows; i++) { 2541a2744918SBarry Smith ii = starts[i]; 2542a2744918SBarry Smith lensi = lens[i]; 2543ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2545a2744918SBarry Smith a_new += lensi; 2546a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2547a2744918SBarry Smith c->ilen[i] = lensi; 254802834360SBarry Smith } 2549*fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25519566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25523a40ed3dSBarry Smith } else { 25539566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25549566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25564dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25576bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25584dcab191SBarry Smith smap[icol[i]] = i + 1; 25594dcab191SBarry Smith } 25604dcab191SBarry Smith 256102834360SBarry Smith /* determine lens of each row */ 256202834360SBarry Smith for (i = 0; i < nrows; i++) { 2563bfeeae90SHong Zhang kstart = ai[irow[i]]; 256402834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256502834360SBarry Smith lens[i] = 0; 256602834360SBarry Smith for (k = kstart; k < kend; k++) { 2567ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256802834360SBarry Smith } 256902834360SBarry Smith } 257017ab2063SBarry Smith /* Create and fill new matrix */ 2571a2744918SBarry Smith if (scall == 
MAT_REUSE_MATRIX) { 2572ace3abfcSBarry Smith PetscBool equal; 25730f5bd95cSBarry Smith 257499141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2575aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25769566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 257728b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25789566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257908480c60SBarry Smith C = *B; 25803a40ed3dSBarry Smith } else { 25813bef6203SJed Brown PetscInt rbs, cbs; 25829566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25839566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25849566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25859566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25869566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25879566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258908480c60SBarry Smith } 25909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2591*fb3c7e2dSJunchao Zhang 259299141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 2593*fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 259417ab2063SBarry Smith for (i = 0; i < nrows; i++) { 259599141d43SSatish Balay row = irow[i]; 2596bfeeae90SHong Zhang kstart = ai[row]; 259799141d43SSatish Balay kend = kstart + a->ilen[row]; 2598bfeeae90SHong Zhang mat_i = c->i[i]; 259999141d43SSatish Balay mat_j = c->j + mat_i; 2600*fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 
260199141d43SSatish Balay mat_ilen = c->ilen + i; 260217ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2603bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2604ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26052e5835c6SStefano Zampini *mat_a++ = aa[k]; 260699141d43SSatish Balay (*mat_ilen)++; 260717ab2063SBarry Smith } 260817ab2063SBarry Smith } 260917ab2063SBarry Smith } 26109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 261102834360SBarry Smith /* Free work space */ 26129566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26139566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26149566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2615cdc6f3adSToby Isaac /* sort */ 2616cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2617cdc6f3adSToby Isaac PetscInt ilen; 2618cdc6f3adSToby Isaac 2619cdc6f3adSToby Isaac mat_i = c->i[i]; 2620cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2621*fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 2622cdc6f3adSToby Isaac ilen = c->ilen[i]; 26239566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2624cdc6f3adSToby Isaac } 2625*fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 262602834360SBarry Smith } 26278c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26289566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2629305c6ccfSStefano Zampini #endif 26309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 263217ab2063SBarry Smith 26339566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2634416022c9SBarry Smith *B = C; 26353a40ed3dSBarry Smith PetscFunctionReturn(0); 263617ab2063SBarry Smith } 263717ab2063SBarry Smith 2638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2639d71ae5a4SJacob 
Faibussowitsch { 264082d44351SHong Zhang Mat B; 264182d44351SHong Zhang 264282d44351SHong Zhang PetscFunctionBegin; 2643c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26449566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26459566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26469566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26479566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26489566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264982d44351SHong Zhang *subMat = B; 2650c2d650bdSHong Zhang } else { 26519566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2652c2d650bdSHong Zhang } 265382d44351SHong Zhang PetscFunctionReturn(0); 265482d44351SHong Zhang } 265582d44351SHong Zhang 2656d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2657d71ae5a4SJacob Faibussowitsch { 265863b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265963b91edcSBarry Smith Mat outA; 2660ace3abfcSBarry Smith PetscBool row_identity, col_identity; 266163b91edcSBarry Smith 26623a40ed3dSBarry Smith PetscFunctionBegin; 266308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26641df811f5SHong Zhang 26659566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26669566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2667a871dcd8SBarry Smith 266863b91edcSBarry Smith outA = inA; 2669d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26709566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26719566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26722205254eSKarl Rupp 26739566063dSJacob Faibussowitsch 
PetscCall(PetscObjectReference((PetscObject)row)); 26749566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26752205254eSKarl Rupp 2676c3122656SLisandro Dalcin a->row = row; 26772205254eSKarl Rupp 26789566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26799566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26802205254eSKarl Rupp 2681c3122656SLisandro Dalcin a->col = col; 268263b91edcSBarry Smith 268336db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26859566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2686f0ec6fceSSatish Balay 268794a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268994a9d846SBarry Smith } 269063b91edcSBarry Smith 26919566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2692137fb511SHong Zhang if (row_identity && col_identity) { 26939566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2694137fb511SHong Zhang } else { 26959566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2696137fb511SHong Zhang } 26973a40ed3dSBarry Smith PetscFunctionReturn(0); 2698a871dcd8SBarry Smith } 2699a871dcd8SBarry Smith 2700d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2701d71ae5a4SJacob Faibussowitsch { 2702f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2703dfa0f9e5SStefano Zampini PetscScalar *v; 2704c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27053a40ed3dSBarry Smith 27063a40ed3dSBarry Smith PetscFunctionBegin; 27079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27089566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 
2709792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27133a40ed3dSBarry Smith PetscFunctionReturn(0); 2714f0b747eeSBarry Smith } 2715f0b747eeSBarry Smith 2716d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2717d71ae5a4SJacob Faibussowitsch { 271816b64355SHong Zhang PetscInt i; 271916b64355SHong Zhang 272016b64355SHong Zhang PetscFunctionBegin; 272116b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27229566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 272316b64355SHong Zhang 272448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272616b64355SHong Zhang 272716b64355SHong Zhang if (submatj->rbuf1) { 27289566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27299566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 273016b64355SHong Zhang } 273116b64355SHong Zhang 273248a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27339566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 273516b64355SHong Zhang } 273616b64355SHong Zhang 273716b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27389566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->rmap)); 27399566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27409566063dSJacob Faibussowitsch 
PetscCall(PetscFree(submatj->rmap_loc)); 274116b64355SHong Zhang #else 27429566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 274316b64355SHong Zhang #endif 274416b64355SHong Zhang 274516b64355SHong Zhang if (!submatj->allcolumns) { 274616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27479566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->cmap)); 274816b64355SHong Zhang #else 27499566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 275016b64355SHong Zhang #endif 275116b64355SHong Zhang } 27529566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 275316b64355SHong Zhang 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 275516b64355SHong Zhang PetscFunctionReturn(0); 275616b64355SHong Zhang } 275716b64355SHong Zhang 2758d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2759d71ae5a4SJacob Faibussowitsch { 276016b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27615c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 276216b64355SHong Zhang 276316b64355SHong Zhang PetscFunctionBegin; 27649566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27659566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 276616b64355SHong Zhang PetscFunctionReturn(0); 276716b64355SHong Zhang } 276816b64355SHong Zhang 276989a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2770d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2771d71ae5a4SJacob Faibussowitsch { 27722d033e1fSHong Zhang PetscInt i; 27730fb991dcSHong Zhang Mat C; 27740fb991dcSHong Zhang Mat_SeqAIJ *c; 27750fb991dcSHong Zhang Mat_SubSppt *submatj; 27762d033e1fSHong Zhang 27772d033e1fSHong Zhang PetscFunctionBegin; 27782d033e1fSHong Zhang for (i = 0; i < n; i++) { 27790fb991dcSHong Zhang C = (*mat)[i]; 27800fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27810fb991dcSHong Zhang 
submatj = c->submatis1; 27822d033e1fSHong Zhang if (submatj) { 2783682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278426cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27859566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27869566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27879566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27883faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27899566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27909566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27919566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2792682e4c99SStefano Zampini } 27932d033e1fSHong Zhang } else { 27949566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27952d033e1fSHong Zhang } 27962d033e1fSHong Zhang } 279786e85357SHong Zhang 279863a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27999566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 280063a75b2aSHong Zhang 28019566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28022d033e1fSHong Zhang PetscFunctionReturn(0); 28032d033e1fSHong Zhang } 28042d033e1fSHong Zhang 2805d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2806d71ae5a4SJacob Faibussowitsch { 280797f1f81fSBarry Smith PetscInt i; 2808cddf8d76SBarry Smith 28093a40ed3dSBarry Smith PetscFunctionBegin; 281048a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2811cddf8d76SBarry Smith 281248a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28133a40ed3dSBarry Smith PetscFunctionReturn(0); 2814cddf8d76SBarry Smith } 2815cddf8d76SBarry Smith 2816d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, 
PetscInt is_max, IS is[], PetscInt ov) 2817d71ae5a4SJacob Faibussowitsch { 2818e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28199a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28205d0c19d7SBarry Smith const PetscInt *idx; 28219a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2822f1af5d2fSBarry Smith PetscBT table; 2823bbd702dbSSatish Balay 28243a40ed3dSBarry Smith PetscFunctionBegin; 28259a88ca10SBarry Smith m = A->rmap->n / bs; 2826e4d965acSSatish Balay ai = a->i; 2827bfeeae90SHong Zhang aj = a->j; 28288a047759SSatish Balay 282908401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 283006763907SSatish Balay 28319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28329566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 283306763907SSatish Balay 2834e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2835b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2836e4d965acSSatish Balay isz = 0; 28379566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2838e4d965acSSatish Balay 2839e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28409566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28419566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2842e4d965acSSatish Balay 28439a88ca10SBarry Smith if (bs > 1) { 28449a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28459a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28469a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28479a88ca10SBarry Smith } 28489a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28499a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28509a88ca10SBarry Smith 28519a88ca10SBarry Smith k = 0; 28529a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28539a88ca10SBarry Smith n = isz; 28549a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28559a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28569a88ca10SBarry Smith row = bs * nidx[k] + ll; 28579a88ca10SBarry Smith start = ai[row]; 28589a88ca10SBarry Smith end = ai[row + 1]; 28599a88ca10SBarry Smith for (l = start; l < end; l++) { 28609a88ca10SBarry Smith val = aj[l] / bs; 28619a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28629a88ca10SBarry Smith } 28639a88ca10SBarry Smith } 28649a88ca10SBarry Smith } 28659a88ca10SBarry Smith } 28669a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28679a88ca10SBarry Smith } else { 2868dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2869e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28702205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28714dcbc457SBarry Smith } 28729566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28739566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2874e4d965acSSatish Balay 287504a348a9SBarry Smith k = 0; 287604a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287704a348a9SBarry Smith n = isz; 287806763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2879e4d965acSSatish Balay row = nidx[k]; 2880e4d965acSSatish Balay start = ai[row]; 2881e4d965acSSatish Balay end = ai[row + 1]; 288204a348a9SBarry Smith for (l = start; l < end; l++) { 2883efb16452SHong Zhang val = aj[l]; 28842205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2885e4d965acSSatish Balay } 2886e4d965acSSatish Balay } 2887e4d965acSSatish Balay } 28889566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2889e4d965acSSatish Balay } 28909a88ca10SBarry Smith } 28919566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28929566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28933a40ed3dSBarry Smith PetscFunctionReturn(0); 28944dcbc457SBarry Smith } 289517ab2063SBarry Smith 28960513a670SBarry Smith /* -------------------------------------------------------------- */ 2897d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2898d71ae5a4SJacob Faibussowitsch { 28990513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29003b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29015d0c19d7SBarry Smith const PetscInt *row, *col; 29025d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 290356cd22aeSBarry Smith IS icolp, irowp; 29040298fd71SBarry Smith PetscInt *cwork = NULL; 
29050298fd71SBarry Smith PetscScalar *vwork = NULL; 29060513a670SBarry Smith 29073a40ed3dSBarry Smith PetscFunctionBegin; 29089566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29099566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29109566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29119566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29120513a670SBarry Smith 29130513a670SBarry Smith /* determine lengths of permuted rows */ 29149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29152205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29169566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29179566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29189566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29199566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29219566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29220513a670SBarry Smith 29239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29240513a670SBarry Smith for (i = 0; i < m; i++) { 29259566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29262205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29279566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29289566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29290513a670SBarry Smith } 29309566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29312205254eSKarl Rupp 29323c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29332205254eSKarl Rupp 29348c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29359566063dSJacob Faibussowitsch 
PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29369fe5e383SStefano Zampini #endif 29379566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29389566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29399566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29409566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29429566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 294348a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29443a40ed3dSBarry Smith PetscFunctionReturn(0); 29450513a670SBarry Smith } 29460513a670SBarry Smith 2947d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2948d71ae5a4SJacob Faibussowitsch { 2949cb5b572fSBarry Smith PetscFunctionBegin; 295033f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 295133f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2952be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2953be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29542e5835c6SStefano Zampini const PetscScalar *aa; 2955be6bf707SBarry Smith 29569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295708401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29599566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2961cb5b572fSBarry Smith } else { 29629566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2963cb5b572fSBarry Smith } 2964cb5b572fSBarry Smith PetscFunctionReturn(0); 2965cb5b572fSBarry Smith } 2966cb5b572fSBarry Smith 2967d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2968d71ae5a4SJacob Faibussowitsch { 2969273d9f13SBarry Smith PetscFunctionBegin; 29709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2971273d9f13SBarry Smith PetscFunctionReturn(0); 2972273d9f13SBarry Smith } 2973273d9f13SBarry Smith 2974d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2975d71ae5a4SJacob Faibussowitsch { 29766c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29776e111a19SKarl Rupp 29786c0721eeSBarry Smith PetscFunctionBegin; 29796c0721eeSBarry Smith *array = a->a; 29806c0721eeSBarry Smith PetscFunctionReturn(0); 29816c0721eeSBarry Smith } 29826c0721eeSBarry Smith 2983d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2984d71ae5a4SJacob Faibussowitsch { 29856c0721eeSBarry Smith PetscFunctionBegin; 2986f38c1e66SStefano Zampini *array = NULL; 29876c0721eeSBarry Smith PetscFunctionReturn(0); 29886c0721eeSBarry Smith } 2989273d9f13SBarry Smith 29908229c054SShri Abhyankar /* 29918229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29928229c054SShri Abhyankar have different nonzero structure. 29938229c054SShri Abhyankar */ 2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2995d71ae5a4SJacob Faibussowitsch { 2996b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2997ec7775f6SShri Abhyankar 2998ec7775f6SShri Abhyankar PetscFunctionBegin; 2999ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3000ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 3001b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 3002b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3003b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30048af7cee1SJed Brown nnz[i] = 0; 30058af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3006b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3007b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30088af7cee1SJed Brown nnz[i]++; 30098af7cee1SJed Brown } 30108af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3011ec7775f6SShri Abhyankar } 3012ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3013ec7775f6SShri Abhyankar } 3014ec7775f6SShri Abhyankar 3015d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3016d71ae5a4SJacob Faibussowitsch { 3017b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3018b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3019b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 3020b264fe52SHong Zhang 3021b264fe52SHong Zhang PetscFunctionBegin; 3022b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30239566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 3024b264fe52SHong Zhang PetscFunctionReturn(0); 3025b264fe52SHong Zhang } 3026b264fe52SHong Zhang 3027d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3028d71ae5a4SJacob Faibussowitsch { 3029ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3030ac90fabeSBarry Smith 3031ac90fabeSBarry Smith PetscFunctionBegin; 3032134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3033134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3034134adf20SPierre Jolivet if (e) { 30359566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 303681fa06acSBarry Smith if (e) { 30379566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3038134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303981fa06acSBarry Smith } 304081fa06acSBarry Smith } 304154c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 304281fa06acSBarry Smith } 3043ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30442e5835c6SStefano Zampini const PetscScalar *xa; 30452e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 304681fa06acSBarry Smith PetscBLASInt one = 1, bnz; 304781fa06acSBarry Smith 30489566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3051792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30569566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3057ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30589566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3059ac90fabeSBarry Smith } else { 30608229c054SShri Abhyankar Mat B; 30618229c054SShri Abhyankar PetscInt *nnz; 30629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30639566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30649566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30659566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30669566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30679566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30699566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30709566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30719bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30729566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3073ac90fabeSBarry Smith } 3074ac90fabeSBarry Smith PetscFunctionReturn(0); 3075ac90fabeSBarry Smith } 3076ac90fabeSBarry Smith 3077d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3078d71ae5a4SJacob Faibussowitsch { 3079354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3080354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3081354c94deSBarry Smith 
PetscInt i, nz; 3082354c94deSBarry Smith PetscScalar *a; 3083354c94deSBarry Smith 3084354c94deSBarry Smith PetscFunctionBegin; 3085354c94deSBarry Smith nz = aij->nz; 30869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30872205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3089354c94deSBarry Smith #else 3090354c94deSBarry Smith PetscFunctionBegin; 3091354c94deSBarry Smith #endif 3092354c94deSBarry Smith PetscFunctionReturn(0); 3093354c94deSBarry Smith } 3094354c94deSBarry Smith 3095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3096d71ae5a4SJacob Faibussowitsch { 3097e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3098d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3099e34fafa9SBarry Smith PetscReal atmp; 3100985db425SBarry Smith PetscScalar *x; 3101ce496241SStefano Zampini const MatScalar *aa, *av; 3102e34fafa9SBarry Smith 3103e34fafa9SBarry Smith PetscFunctionBegin; 310428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3106ce496241SStefano Zampini aa = av; 3107e34fafa9SBarry Smith ai = a->i; 3108e34fafa9SBarry Smith aj = a->j; 3109e34fafa9SBarry Smith 31109566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31119566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31129566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3114e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31159371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31169371c9d4SSatish Balay ai++; 3117e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3118985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
31199371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31209371c9d4SSatish Balay x[i] = atmp; 31219371c9d4SSatish Balay if (idx) idx[i] = *aj; 31229371c9d4SSatish Balay } 31239371c9d4SSatish Balay aa++; 31249371c9d4SSatish Balay aj++; 3125985db425SBarry Smith } 3126985db425SBarry Smith } 31279566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3129985db425SBarry Smith PetscFunctionReturn(0); 3130985db425SBarry Smith } 3131985db425SBarry Smith 3132d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3133d71ae5a4SJacob Faibussowitsch { 3134985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3135d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3136985db425SBarry Smith PetscScalar *x; 3137ce496241SStefano Zampini const MatScalar *aa, *av; 3138985db425SBarry Smith 3139985db425SBarry Smith PetscFunctionBegin; 314028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3142ce496241SStefano Zampini aa = av; 3143985db425SBarry Smith ai = a->i; 3144985db425SBarry Smith aj = a->j; 3145985db425SBarry Smith 31469566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31479566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31489566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 314908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3150985db425SBarry Smith for (i = 0; i < m; i++) { 31519371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31529371c9d4SSatish Balay ai++; 3153d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31549371c9d4SSatish Balay x[i] = *aa; 31559371c9d4SSatish Balay if (idx) idx[i] = 0; 3156985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3157985db425SBarry Smith x[i] = 0.0; 3158985db425SBarry Smith if (idx) { 3159985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3160985db425SBarry Smith if (aj[j] > j) { 3161985db425SBarry Smith idx[i] = j; 3162985db425SBarry Smith break; 3163985db425SBarry Smith } 3164985db425SBarry Smith } 31651a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31661a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3167985db425SBarry Smith } 3168985db425SBarry Smith } 3169985db425SBarry Smith for (j = 0; j < ncols; j++) { 31709371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31719371c9d4SSatish Balay x[i] = *aa; 31729371c9d4SSatish Balay if (idx) idx[i] = *aj; 31739371c9d4SSatish Balay } 31749371c9d4SSatish Balay aa++; 31759371c9d4SSatish Balay aj++; 3176985db425SBarry Smith } 3177985db425SBarry Smith } 31789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3180985db425SBarry Smith PetscFunctionReturn(0); 3181985db425SBarry Smith } 3182985db425SBarry Smith 3183d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3184d71ae5a4SJacob Faibussowitsch { 3185c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3186c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3187ce496241SStefano Zampini PetscScalar *x; 3188ce496241SStefano Zampini const MatScalar *aa, *av; 3189c87e5d42SMatthew Knepley 3190c87e5d42SMatthew Knepley PetscFunctionBegin; 31919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3192ce496241SStefano Zampini aa = av; 3193c87e5d42SMatthew Knepley ai = a->i; 3194c87e5d42SMatthew Knepley aj = a->j; 3195c87e5d42SMatthew Knepley 31969566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31979566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31989566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 319908401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3200c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32019371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32029371c9d4SSatish Balay ai++; 3203f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32049371c9d4SSatish Balay x[i] = *aa; 32059371c9d4SSatish Balay if (idx) idx[i] = 0; 3206f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3207f07e67edSHong Zhang x[i] = 0.0; 3208f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3209289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3210f07e67edSHong Zhang if (aj[j] > j) { 3211f07e67edSHong Zhang idx[i] = j; 32122205254eSKarl Rupp break; 32132205254eSKarl Rupp } 3214289a08f5SMatthew Knepley } 3215f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3216f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3217f07e67edSHong Zhang } 3218289a08f5SMatthew Knepley } 3219c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32209371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32219371c9d4SSatish Balay x[i] = *aa; 32229371c9d4SSatish Balay if (idx) idx[i] = *aj; 32239371c9d4SSatish Balay } 32249371c9d4SSatish Balay aa++; 32259371c9d4SSatish Balay aj++; 3226c87e5d42SMatthew Knepley } 3227c87e5d42SMatthew Knepley } 32289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3230c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3231c87e5d42SMatthew Knepley } 3232c87e5d42SMatthew Knepley 3233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3234d71ae5a4SJacob 
Faibussowitsch { 3235985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3236d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3237d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3238985db425SBarry Smith PetscScalar *x; 3239ce496241SStefano Zampini const MatScalar *aa, *av; 3240985db425SBarry Smith 3241985db425SBarry Smith PetscFunctionBegin; 324228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3244ce496241SStefano Zampini aa = av; 3245985db425SBarry Smith ai = a->i; 3246985db425SBarry Smith aj = a->j; 3247985db425SBarry Smith 32489566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32499566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32509566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 325108401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3252985db425SBarry Smith for (i = 0; i < m; i++) { 32539371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32549371c9d4SSatish Balay ai++; 3255d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32569371c9d4SSatish Balay x[i] = *aa; 32579371c9d4SSatish Balay if (idx) idx[i] = 0; 3258985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3259985db425SBarry Smith x[i] = 0.0; 3260985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3261985db425SBarry Smith for (j = 0; j < ncols; j++) { 3262985db425SBarry Smith if (aj[j] > j) { 3263985db425SBarry Smith idx[i] = j; 3264985db425SBarry Smith break; 3265985db425SBarry Smith } 3266985db425SBarry Smith } 3267fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3268fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3269985db425SBarry Smith } 3270985db425SBarry Smith } 3271985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32729371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32739371c9d4SSatish Balay x[i] = *aa; 32749371c9d4SSatish Balay if (idx) idx[i] = *aj; 32759371c9d4SSatish Balay } 32769371c9d4SSatish Balay aa++; 32779371c9d4SSatish Balay aj++; 3278e34fafa9SBarry Smith } 3279e34fafa9SBarry Smith } 32809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3282e34fafa9SBarry Smith PetscFunctionReturn(0); 3283e34fafa9SBarry Smith } 3284bbead8a2SBarry Smith 3285d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3286d71ae5a4SJacob Faibussowitsch { 3287bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 328833d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3289bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32900da83c2eSBarry Smith const PetscReal shift = 0.0; 32911a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3292bbead8a2SBarry Smith 3293bbead8a2SBarry Smith PetscFunctionBegin; 3294a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32954a0d0026SBarry Smith if (a->ibdiagvalid) { 32964a0d0026SBarry Smith if (values) *values = a->ibdiag; 32974a0d0026SBarry Smith PetscFunctionReturn(0); 32984a0d0026SBarry Smith } 32999566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33004dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3301bbead8a2SBarry Smith diag = a->ibdiag; 3302bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3303bbead8a2SBarry Smith /* factor and invert each block */ 3304bbead8a2SBarry Smith switch (bs) { 3305bbead8a2SBarry Smith case 1: 3306bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33079566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3308ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3309ec1892c8SHong Zhang if (allowzeropivot) { 33107b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33117b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33127b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33139566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 331498921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3315ec1892c8SHong Zhang } 3316bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3317bbead8a2SBarry Smith } 3318bbead8a2SBarry Smith break; 3319bbead8a2SBarry Smith case 2: 3320bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33219371c9d4SSatish Balay ij[0] = 2 * i; 33229371c9d4SSatish Balay ij[1] = 2 * i + 1; 33239566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33249566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33257b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3327bbead8a2SBarry Smith diag += 4; 3328bbead8a2SBarry Smith } 3329bbead8a2SBarry Smith break; 3330bbead8a2SBarry Smith case 3: 3331bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33329371c9d4SSatish Balay ij[0] = 3 * i; 33339371c9d4SSatish Balay ij[1] = 3 * i + 1; 33349371c9d4SSatish Balay ij[2] = 3 * i + 2; 33359566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33377b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33389566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3339bbead8a2SBarry Smith diag += 9; 3340bbead8a2SBarry Smith } 3341bbead8a2SBarry Smith break; 3342bbead8a2SBarry Smith case 4: 3343bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33449371c9d4SSatish Balay ij[0] = 4 * i; 33459371c9d4SSatish Balay ij[1] = 4 * i + 1; 33469371c9d4SSatish Balay ij[2] = 4 * i + 2; 33479371c9d4SSatish Balay ij[3] = 4 * i + 3; 33489566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33507b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3352bbead8a2SBarry Smith diag += 16; 3353bbead8a2SBarry Smith } 3354bbead8a2SBarry Smith break; 3355bbead8a2SBarry Smith case 5: 3356bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33579371c9d4SSatish Balay ij[0] = 5 * i; 33589371c9d4SSatish Balay ij[1] = 5 * i + 1; 33599371c9d4SSatish Balay ij[2] = 5 * i + 2; 33609371c9d4SSatish Balay ij[3] = 5 * i + 3; 33619371c9d4SSatish Balay ij[4] = 5 * i + 4; 33629566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33647b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3366bbead8a2SBarry Smith diag += 25; 3367bbead8a2SBarry Smith } 3368bbead8a2SBarry Smith break; 3369bbead8a2SBarry Smith case 6: 3370bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33719371c9d4SSatish Balay ij[0] = 6 * i; 33729371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33739371c9d4SSatish Balay ij[2] = 6 * i + 2; 33749371c9d4SSatish Balay ij[3] = 6 * i + 3; 33759371c9d4SSatish Balay ij[4] = 6 * i + 4; 33769371c9d4SSatish Balay ij[5] = 6 * i + 5; 33779566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33789566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33797b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3381bbead8a2SBarry Smith diag += 36; 3382bbead8a2SBarry Smith } 3383bbead8a2SBarry Smith break; 3384bbead8a2SBarry Smith case 7: 3385bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33869371c9d4SSatish Balay ij[0] = 7 * i; 33879371c9d4SSatish Balay ij[1] = 7 * i + 1; 33889371c9d4SSatish Balay ij[2] = 7 * i + 2; 33899371c9d4SSatish Balay ij[3] = 7 * i + 3; 33909371c9d4SSatish Balay ij[4] = 7 * i + 4; 33919371c9d4SSatish Balay ij[5] = 7 * i + 5; 3392cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 33939566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33949566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33957b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33969566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3397bbead8a2SBarry Smith diag += 49; 3398bbead8a2SBarry Smith } 3399bbead8a2SBarry Smith break; 3400bbead8a2SBarry Smith default: 34019566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3402bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3403ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34049566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, 
v_work, allowzeropivot, &zeropivotdetected)); 34067b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34079566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3408bbead8a2SBarry Smith diag += bs2; 3409bbead8a2SBarry Smith } 34109566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3411bbead8a2SBarry Smith } 3412bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3413bbead8a2SBarry Smith PetscFunctionReturn(0); 3414bbead8a2SBarry Smith } 3415bbead8a2SBarry Smith 3416d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3417d71ae5a4SJacob Faibussowitsch { 341873a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3419fff043a9SJunchao Zhang PetscScalar a, *aa; 342073a71a0fSBarry Smith PetscInt m, n, i, j, col; 342173a71a0fSBarry Smith 342273a71a0fSBarry Smith PetscFunctionBegin; 342373a71a0fSBarry Smith if (!x->assembled) { 34249566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 342573a71a0fSBarry Smith for (i = 0; i < m; i++) { 342673a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34279566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 342873a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34299566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 343073a71a0fSBarry Smith } 343173a71a0fSBarry Smith } 3432e2ce353bSJunchao Zhang } else { 34339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34349566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3436e2ce353bSJunchao Zhang } 34379566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34389566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 343973a71a0fSBarry Smith PetscFunctionReturn(0); 
344073a71a0fSBarry Smith } 344173a71a0fSBarry Smith 3442679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3443d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3444d71ae5a4SJacob Faibussowitsch { 3445679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3446679944adSJunchao Zhang PetscScalar a; 3447679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3448679944adSJunchao Zhang 3449679944adSJunchao Zhang PetscFunctionBegin; 3450679944adSJunchao Zhang nskip = high - low; 34519566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3452679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3453679944adSJunchao Zhang for (i = 0; i < m; i++) { 3454679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34559566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3456679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3457679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34589566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3459679944adSJunchao Zhang } 3460e2ce353bSJunchao Zhang } 34619566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34629566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 3463679944adSJunchao Zhang PetscFunctionReturn(0); 3464679944adSJunchao Zhang } 3465679944adSJunchao Zhang 3466682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34670a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3468cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3469cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3470cb5b572fSBarry Smith MatMult_SeqAIJ, 347197304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34727c922b88SBarry Smith 
MatMultTranspose_SeqAIJ, 34737c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3474f4259b30SLisandro Dalcin NULL, 3475f4259b30SLisandro Dalcin NULL, 3476f4259b30SLisandro Dalcin NULL, 3477f4259b30SLisandro Dalcin /* 10*/ NULL, 3478cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3479f4259b30SLisandro Dalcin NULL, 348041f059aeSBarry Smith MatSOR_SeqAIJ, 348191e9d3e2SHong Zhang MatTranspose_SeqAIJ, 348297304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3483cb5b572fSBarry Smith MatEqual_SeqAIJ, 3484cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3485cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3486cb5b572fSBarry Smith MatNorm_SeqAIJ, 3487f4259b30SLisandro Dalcin /* 20*/ NULL, 3488cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3489cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3490cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3491d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3492f4259b30SLisandro Dalcin NULL, 3493f4259b30SLisandro Dalcin NULL, 3494f4259b30SLisandro Dalcin NULL, 3495f4259b30SLisandro Dalcin NULL, 34964994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3497f4259b30SLisandro Dalcin NULL, 3498f4259b30SLisandro Dalcin NULL, 3499f4259b30SLisandro Dalcin NULL, 3500f4259b30SLisandro Dalcin NULL, 3501d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 3504cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3505f4259b30SLisandro Dalcin NULL, 3506d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35077dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3508cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3509cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3510cb5b572fSBarry Smith MatCopy_SeqAIJ, 3511d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3512cb5b572fSBarry Smith MatScale_SeqAIJ, 35137d68702bSBarry Smith MatShift_SeqAIJ, 351479299369SBarry Smith MatDiagonalSet_SeqAIJ, 35156e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 351673a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35173b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 
35183b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35193b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3520a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 352193dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3522f4259b30SLisandro Dalcin NULL, 3523f4259b30SLisandro Dalcin NULL, 3524cda55fadSBarry Smith MatPermute_SeqAIJ, 3525f4259b30SLisandro Dalcin NULL, 3526f4259b30SLisandro Dalcin /* 59*/ NULL, 3527b9b97703SBarry Smith MatDestroy_SeqAIJ, 3528b9b97703SBarry Smith MatView_SeqAIJ, 3529f4259b30SLisandro Dalcin NULL, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin /* 64*/ NULL, 3532321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin NULL, 3535f4259b30SLisandro Dalcin NULL, 3536d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3537c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3538f4259b30SLisandro Dalcin NULL, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin /* 74*/ NULL, 35423acb8795SBarry Smith MatFDColoringApply_AIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 35466ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3547f4259b30SLisandro Dalcin NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550bc011b1eSHong Zhang MatLoad_SeqAIJ, 3551d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35521cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin /* 89*/ NULL, 3557f4259b30SLisandro Dalcin NULL, 355826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 35618fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 35646fc122caSHong Zhang 
MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3565f4259b30SLisandro Dalcin NULL, 35664222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 356987d4246cSBarry Smith MatConjugate_SeqAIJ, 3570f4259b30SLisandro Dalcin NULL, 3571d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 357299cafbc1SBarry Smith MatRealPart_SeqAIJ, 3573f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 3576cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3577f4259b30SLisandro Dalcin NULL, 35782af78befSBarry Smith MatGetRowMin_SeqAIJ, 3579f4259b30SLisandro Dalcin NULL, 3580599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3581f4259b30SLisandro Dalcin /*114*/ NULL, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 3584f4259b30SLisandro Dalcin NULL, 3585f4259b30SLisandro Dalcin NULL, 3586f4259b30SLisandro Dalcin /*119*/ NULL, 3587f4259b30SLisandro Dalcin NULL, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35910716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3592a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 359337868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35940da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin /*129*/ NULL, 3597f4259b30SLisandro Dalcin NULL, 3598f4259b30SLisandro Dalcin NULL, 359975648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3600b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3601b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36022b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 36053964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3606f4259b30SLisandro Dalcin /*139*/ NULL, 3607f4259b30SLisandro Dalcin NULL, 3608f4259b30SLisandro Dalcin 
NULL, 36093a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36109c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36114222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36124222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3613f4259b30SLisandro Dalcin NULL, 361472833a62Smarkadams4 NULL, 361572833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36162d776b49SBarry Smith NULL, 36179371c9d4SSatish Balay /*150*/ MatTransposeSymbolic_SeqAIJ}; 361817ab2063SBarry Smith 3619d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3620d71ae5a4SJacob Faibussowitsch { 3621bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 362297f1f81fSBarry Smith PetscInt i, nz, n; 3623bef8e0ddSBarry Smith 3624bef8e0ddSBarry Smith PetscFunctionBegin; 3625bef8e0ddSBarry Smith nz = aij->maxnz; 3626d0f46423SBarry Smith n = mat->rmap->n; 3627ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3628bef8e0ddSBarry Smith aij->nz = nz; 3629ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 3630bef8e0ddSBarry Smith PetscFunctionReturn(0); 3631bef8e0ddSBarry Smith } 3632bef8e0ddSBarry Smith 3633a3bb6f32SFande Kong /* 3634ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3635ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3636ddea5d60SJunchao Zhang */ 3637d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3638d71ae5a4SJacob Faibussowitsch { 3639a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3640a3bb6f32SFande Kong PetscTable gid1_lid1; 3641a3bb6f32SFande Kong PetscTablePosition tpos; 364225b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 364325b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3644a3bb6f32SFande Kong 3645a3bb6f32SFande Kong PetscFunctionBegin; 3646a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3647a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3648a3bb6f32SFande Kong /* use a table */ 36499566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n, mat->cmap->N + 1, &gid1_lid1)); 3650a3bb6f32SFande Kong ec = 0; 365125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 365225b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 36539566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &data)); 3654a3bb6f32SFande Kong if (!data) { 3655a3bb6f32SFande Kong /* one based table */ 36569566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1, gid1, ++ec, INSERT_VALUES)); 3657a3bb6f32SFande Kong } 3658a3bb6f32SFande Kong } 3659a3bb6f32SFande Kong /* form array of columns we need */ 36609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 36619566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1, &tpos)); 3662a3bb6f32SFande Kong while (tpos) { 36639566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1, &tpos, &gid, &lid)); 3664a3bb6f32SFande Kong gid--; 3665a3bb6f32SFande Kong lid--; 3666a3bb6f32SFande Kong garray[lid] = gid; 3667a3bb6f32SFande Kong } 36689566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* 
sort, and rebuild */ 36699566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 367048a46eb9SPierre Jolivet for (i = 0; i < ec; i++) PetscCall(PetscTableAdd(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES)); 3671a3bb6f32SFande Kong /* compact out the extra columns in B */ 367225b670f0SStefano Zampini for (i = 0; i < nz; i++) { 367325b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36749566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &lid)); 3675a3bb6f32SFande Kong lid--; 367625b670f0SStefano Zampini jj[i] = lid; 3677a3bb6f32SFande Kong } 36789566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36799566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36809566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36819566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36829566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3683a3bb6f32SFande Kong PetscFunctionReturn(0); 3684a3bb6f32SFande Kong } 3685a3bb6f32SFande Kong 3686bef8e0ddSBarry Smith /*@ 3687bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3688bef8e0ddSBarry Smith in the matrix. 3689bef8e0ddSBarry Smith 3690bef8e0ddSBarry Smith Input Parameters: 369111a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3692bef8e0ddSBarry Smith - indices - the column indices 3693bef8e0ddSBarry Smith 369415091d37SBarry Smith Level: advanced 369515091d37SBarry Smith 3696bef8e0ddSBarry Smith Notes: 3697bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3698bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 369911a5261eSBarry Smith of the `MatSetValues()` operation. 
3700bef8e0ddSBarry Smith 3701bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 370211a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3703bef8e0ddSBarry Smith 370411a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3705bef8e0ddSBarry Smith 3706b9617806SBarry Smith The indices should start with zero, not one. 3707b9617806SBarry Smith 3708bef8e0ddSBarry Smith @*/ 3709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3710d71ae5a4SJacob Faibussowitsch { 3711bef8e0ddSBarry Smith PetscFunctionBegin; 37120700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3713dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3714cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3715bef8e0ddSBarry Smith PetscFunctionReturn(0); 3716bef8e0ddSBarry Smith } 3717bef8e0ddSBarry Smith 3718be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3719be6bf707SBarry Smith 3720d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3721d71ae5a4SJacob Faibussowitsch { 3722be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3723d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3724be6bf707SBarry Smith 3725be6bf707SBarry Smith PetscFunctionBegin; 372628b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3727be6bf707SBarry Smith 3728be6bf707SBarry Smith /* allocate space for values if not already there */ 37294dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3730be6bf707SBarry Smith 3731be6bf707SBarry Smith /* copy values over */ 37329566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, 
nz)); 3733be6bf707SBarry Smith PetscFunctionReturn(0); 3734be6bf707SBarry Smith } 3735be6bf707SBarry Smith 3736be6bf707SBarry Smith /*@ 3737be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3738be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3739be6bf707SBarry Smith nonlinear portion. 3740be6bf707SBarry Smith 3741c3339decSBarry Smith Logically Collect 3742be6bf707SBarry Smith 3743be6bf707SBarry Smith Input Parameters: 374411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3745be6bf707SBarry Smith 374615091d37SBarry Smith Level: advanced 374715091d37SBarry Smith 374811a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3749be6bf707SBarry Smith $ Create Jacobian matrix 3750be6bf707SBarry Smith $ Set linear terms into matrix 3751be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3752be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3753be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3754512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3755be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3756be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3757be6bf707SBarry Smith $ In your Jacobian routine 3758be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3759be6bf707SBarry Smith $ Set nonlinear terms in matrix 3760be6bf707SBarry Smith 3761be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. 
when you handle nonlinear solve yourself: 3762be6bf707SBarry Smith $ // build linear portion of Jacobian 3763512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3764be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3765be6bf707SBarry Smith $ loop over nonlinear iterations 3766be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3767be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3768be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3769be6bf707SBarry Smith $ Solve linear system with Jacobian 3770be6bf707SBarry Smith $ endloop 3771be6bf707SBarry Smith 3772be6bf707SBarry Smith Notes: 3773da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 377411a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3775be6bf707SBarry Smith calling this routine. 3776be6bf707SBarry Smith 37770c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37780c468ba9SBarry Smith and does not allocated additional space. 
37790c468ba9SBarry Smith 3780db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3781be6bf707SBarry Smith @*/ 3782d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3783d71ae5a4SJacob Faibussowitsch { 3784be6bf707SBarry Smith PetscFunctionBegin; 37850700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 378628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 378728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3788cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3789be6bf707SBarry Smith PetscFunctionReturn(0); 3790be6bf707SBarry Smith } 3791be6bf707SBarry Smith 3792d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3793d71ae5a4SJacob Faibussowitsch { 3794be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3795d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3796be6bf707SBarry Smith 3797be6bf707SBarry Smith PetscFunctionBegin; 379828b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 379928b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3800be6bf707SBarry Smith /* copy values over */ 38019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3802be6bf707SBarry Smith PetscFunctionReturn(0); 3803be6bf707SBarry Smith } 3804be6bf707SBarry Smith 3805be6bf707SBarry Smith /*@ 3806be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3807be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3808be6bf707SBarry Smith nonlinear portion. 
3809be6bf707SBarry Smith 3810c3339decSBarry Smith Logically Collect 3811be6bf707SBarry Smith 3812be6bf707SBarry Smith Input Parameters: 381311a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3814be6bf707SBarry Smith 381515091d37SBarry Smith Level: advanced 381615091d37SBarry Smith 3817db781477SPatrick Sanan .seealso: `MatStoreValues()` 3818be6bf707SBarry Smith @*/ 3819d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3820d71ae5a4SJacob Faibussowitsch { 3821be6bf707SBarry Smith PetscFunctionBegin; 38220700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 382328b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 382428b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3825cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 3826be6bf707SBarry Smith PetscFunctionReturn(0); 3827be6bf707SBarry Smith } 3828be6bf707SBarry Smith 3829be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 383017ab2063SBarry Smith /*@C 383111a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38320d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38336e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 383451c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38352bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 383617ab2063SBarry Smith 3837d083f849SBarry Smith Collective 3838db81eaa0SLois Curfman McInnes 383917ab2063SBarry Smith Input Parameters: 384011a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 384117ab2063SBarry Smith . 
m - number of rows 384217ab2063SBarry Smith . n - number of columns 384317ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 384451c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38450298fd71SBarry Smith (possibly different for each row) or NULL 384617ab2063SBarry Smith 384717ab2063SBarry Smith Output Parameter: 3848416022c9SBarry Smith . A - the matrix 384917ab2063SBarry Smith 385011a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3851f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 385211a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3853175b88e8SBarry Smith 3854b259b22eSLois Curfman McInnes Notes: 385549a6f317SBarry Smith If nnz is given then nz is ignored 385649a6f317SBarry Smith 385711a5261eSBarry Smith The AIJ format, also called 385811a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38590002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 386044cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 386117ab2063SBarry Smith 386217ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 386311a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38643d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38656da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 386617ab2063SBarry Smith 3867682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38684fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3869682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38706c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38716c7ebb05SLois Curfman McInnes 38726c7ebb05SLois Curfman McInnes Options Database Keys: 3873698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38749db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 387517ab2063SBarry Smith 3876027ccd11SLois Curfman McInnes Level: intermediate 3877027ccd11SLois Curfman McInnes 387860161072SBarry Smith .seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 387917ab2063SBarry Smith @*/ 3880d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3881d71ae5a4SJacob Faibussowitsch { 38823a40ed3dSBarry Smith PetscFunctionBegin; 38839566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38849566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38859566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 3887273d9f13SBarry Smith PetscFunctionReturn(0); 3888273d9f13SBarry Smith } 3889273d9f13SBarry Smith 3890273d9f13SBarry Smith /*@C 3891273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3892273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3893273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3894273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 
3895273d9f13SBarry Smith 3896d083f849SBarry Smith Collective 3897273d9f13SBarry Smith 3898273d9f13SBarry Smith Input Parameters: 38991c4f3114SJed Brown + B - The matrix 3900273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3901273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39020298fd71SBarry Smith (possibly different for each row) or NULL 3903273d9f13SBarry Smith 3904273d9f13SBarry Smith Notes: 390549a6f317SBarry Smith If nnz is given then nz is ignored 390649a6f317SBarry Smith 390711a5261eSBarry Smith The `MATSEQAIJ` format also called 390811a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 3909273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3910273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3911273d9f13SBarry Smith 3912273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 391311a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 3914273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3915273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3916273d9f13SBarry Smith 391711a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3918aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3919aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3920aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3921aa95bbe8SBarry Smith 392211a5261eSBarry Smith Developer Notes: 392311a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3924a96a251dSBarry Smith entries or columns indices 3925a96a251dSBarry Smith 3926273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3927273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3928273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3929273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3930273d9f13SBarry Smith 3931273d9f13SBarry Smith Options Database Keys: 3932698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 393347b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3934273d9f13SBarry Smith 3935273d9f13SBarry Smith Level: intermediate 3936273d9f13SBarry Smith 3937db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3938db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3939273d9f13SBarry Smith @*/ 3940d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3941d71ae5a4SJacob Faibussowitsch { 3942a23d5eceSKris Buschelman PetscFunctionBegin; 39436ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39446ba663aaSJed Brown PetscValidType(B, 1); 3945cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3946a23d5eceSKris Buschelman PetscFunctionReturn(0); 3947a23d5eceSKris Buschelman } 3948a23d5eceSKris Buschelman 3949d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3950d71ae5a4SJacob Faibussowitsch { 3951273d9f13SBarry Smith Mat_SeqAIJ *b; 39522576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 395397f1f81fSBarry Smith PetscInt i; 3954273d9f13SBarry Smith 3955273d9f13SBarry Smith PetscFunctionBegin; 39562576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3957a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3958c461c341SBarry Smith skipallocation = PETSC_TRUE; 3959c461c341SBarry Smith nz = 0; 3960c461c341SBarry Smith } 39619566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39629566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3963899cda47SBarry Smith 3964435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 396508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3966cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3967d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 396808401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 396908401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3970b73539f3SBarry Smith } 3971b73539f3SBarry Smith } 3972b73539f3SBarry Smith 3973273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39742205254eSKarl Rupp 3975273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3976273d9f13SBarry Smith 3977ab93d7beSBarry Smith if (!skipallocation) { 39784dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3979071fcb05SBarry Smith if (!b->ilen) { 3980071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39819566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3982071fcb05SBarry Smith } else { 39839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39842ee49352SLisandro Dalcin } 39854dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3986273d9f13SBarry Smith if (!nnz) { 3987435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3988c62bd62aSJed Brown else if (nz < 0) nz = 1; 39895d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3990d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3991d0f46423SBarry Smith nz = nz * B->rmap->n; 3992273d9f13SBarry Smith } else { 3993c73702f5SBarry Smith PetscInt64 nz64 = 0; 39949371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39959371c9d4SSatish Balay b->imax[i] = nnz[i]; 39969371c9d4SSatish Balay nz64 += nnz[i]; 39979371c9d4SSatish Balay } 39989566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3999273d9f13SBarry Smith } 4000ab93d7beSBarry Smith 4001273d9f13SBarry Smith /* allocate the matrix space */ 400253dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40039566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4004396832f4SHong Zhang if (B->structure_only) { 40059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4007396832f4SHong Zhang } else { 40089566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4009396832f4SHong Zhang } 4010bfeeae90SHong Zhang b->i[0] = 0; 4011ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4012396832f4SHong Zhang if (B->structure_only) { 4013396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4014396832f4SHong Zhang b->free_a = PETSC_FALSE; 4015396832f4SHong Zhang } else { 4016273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4017e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4018396832f4SHong Zhang } 4019e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4020c461c341SBarry Smith } else { 4021e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4022e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4023c461c341SBarry Smith } 4024273d9f13SBarry Smith 4025846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4026846b4da1SFande Kong /* reserve user-requested sparsity */ 40279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4028846b4da1SFande Kong } 4029846b4da1SFande Kong 4030273d9f13SBarry Smith b->nz = 0; 4031273d9f13SBarry Smith b->maxnz = nz; 4032273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40331baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4034cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4035cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40365519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40375519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40385519a089SJose E. Roman */ 40395519a089SJose E. Roman B->nonzerostate++; 4040273d9f13SBarry Smith PetscFunctionReturn(0); 4041273d9f13SBarry Smith } 4042273d9f13SBarry Smith 4043d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4044d71ae5a4SJacob Faibussowitsch { 4045846b4da1SFande Kong Mat_SeqAIJ *a; 4046a5bbaf83SFande Kong PetscInt i; 4047846b4da1SFande Kong 4048846b4da1SFande Kong PetscFunctionBegin; 4049846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405014d0e64fSAlex Lindsay 405114d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 405214d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 405314d0e64fSAlex Lindsay 4054846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40552c814fdeSFande Kong /* if no saved info, we error out */ 405628b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40572c814fdeSFande Kong 4058aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40592c814fdeSFande Kong 40609566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40619566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4062846b4da1SFande Kong a->i[0] = 0; 4063ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4064846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4065846b4da1SFande Kong a->nz = 0; 4066846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4067846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4068846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4069846b4da1SFande Kong A->assembled = PETSC_FALSE; 4070846b4da1SFande Kong PetscFunctionReturn(0); 4071846b4da1SFande Kong } 4072846b4da1SFande Kong 407358d36128SBarry Smith /*@ 407411a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
sparse sequential matrix in `MATSEQAIJ` format. 4075a1661176SMatthew Knepley 4076a1661176SMatthew Knepley Input Parameters: 4077a1661176SMatthew Knepley + B - the matrix 4078a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4079a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4080a1661176SMatthew Knepley - v - optional values in the matrix 4081a1661176SMatthew Knepley 4082a1661176SMatthew Knepley Level: developer 4083a1661176SMatthew Knepley 40846a9b8d82SBarry Smith Notes: 408511a5261eSBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 408658d36128SBarry Smith 40876a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40886a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40896a9b8d82SBarry Smith 40906a9b8d82SBarry Smith Developer Notes: 40916a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 409211a5261eSBarry Smith then just copies the v values directly with `PetscMemcpy()`. 40936a9b8d82SBarry Smith 409411a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
40956a9b8d82SBarry Smith 4096db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4097a1661176SMatthew Knepley @*/ 4098d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4099d71ae5a4SJacob Faibussowitsch { 4100a1661176SMatthew Knepley PetscFunctionBegin; 41010700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41026ba663aaSJed Brown PetscValidType(B, 1); 4103cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4104a1661176SMatthew Knepley PetscFunctionReturn(0); 4105a1661176SMatthew Knepley } 4106a1661176SMatthew Knepley 4107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4108d71ae5a4SJacob Faibussowitsch { 4109a1661176SMatthew Knepley PetscInt i; 4110a1661176SMatthew Knepley PetscInt m, n; 4111a1661176SMatthew Knepley PetscInt nz; 41126a9b8d82SBarry Smith PetscInt *nnz; 4113a1661176SMatthew Knepley 4114a1661176SMatthew Knepley PetscFunctionBegin; 4115aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4116779a8d59SSatish Balay 41179566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41189566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4119779a8d59SSatish Balay 41209566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4122a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4123b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 412408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4125a1661176SMatthew Knepley nnz[i] = nz; 4126a1661176SMatthew Knepley } 41279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41289566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4129a1661176SMatthew Knepley 413048a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4131a1661176SMatthew Knepley 41329566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41339566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4134a1661176SMatthew Knepley 41359566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4136a1661176SMatthew Knepley PetscFunctionReturn(0); 4137a1661176SMatthew Knepley } 4138a1661176SMatthew Knepley 4139ad7e164aSPierre Jolivet /*@ 4140ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4141ad7e164aSPierre Jolivet 4142ad7e164aSPierre Jolivet Input Parameters: 4143ad7e164aSPierre Jolivet + A - left-hand side matrix 4144ad7e164aSPierre Jolivet . B - right-hand side matrix 414511a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4146ad7e164aSPierre Jolivet 4147ad7e164aSPierre Jolivet Output Parameter: 4148ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4149ad7e164aSPierre Jolivet 4150ad7e164aSPierre Jolivet Level: intermediate 4151ad7e164aSPierre Jolivet 415211a5261eSBarry Smith Note: 415311a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4154ad7e164aSPierre Jolivet 4155db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4156ad7e164aSPierre Jolivet @*/ 4157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4158d71ae5a4SJacob Faibussowitsch { 4159ad7e164aSPierre Jolivet PetscFunctionBegin; 4160ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4161ad7e164aSPierre Jolivet PetscValidType(A, 1); 4162ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4163ad7e164aSPierre Jolivet PetscValidType(B, 2); 4164ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4165ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4166ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4167ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4168ad7e164aSPierre Jolivet } 4169cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4170ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4171ad7e164aSPierre Jolivet } 4172ad7e164aSPierre Jolivet 4173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4174d71ae5a4SJacob Faibussowitsch { 4175ad7e164aSPierre Jolivet Mat newmat; 4176ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4177ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4178ad7e164aSPierre Jolivet PetscScalar *v; 4179fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4180ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4181ad7e164aSPierre Jolivet PetscBool flg; 4182ad7e164aSPierre Jolivet 4183ad7e164aSPierre Jolivet PetscFunctionBegin; 418428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418528b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 418628b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418728b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 418928b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4190aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4191ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41929566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41939566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41949566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41959566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4196ad7e164aSPierre Jolivet i[0] = 0; 4197ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4198ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4199ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4200ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4201ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4202ad7e164aSPierre Jolivet } 4203ad7e164aSPierre Jolivet } 4204ad7e164aSPierre Jolivet } 42059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4206ad7e164aSPierre Jolivet *C = newmat; 42079566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4208ad7e164aSPierre Jolivet nnz = 0; 4209ad7e164aSPierre Jolivet } 42109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 42119566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4213ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4214ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4215ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4216ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4217ad7e164aSPierre Jolivet } 4218ad7e164aSPierre Jolivet } 4219ad7e164aSPierre Jolivet } 42209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4223ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4224ad7e164aSPierre Jolivet } 4225ad7e164aSPierre Jolivet 4226c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4227af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4228170fe5c8SBarry Smith 4229170fe5c8SBarry Smith /* 4230170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4231170fe5c8SBarry Smith 4232170fe5c8SBarry Smith n p p 42332da392ccSBarry Smith [ ] [ ] [ ] 42342da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42352da392ccSBarry Smith [ ] [ ] [ ] 4236170fe5c8SBarry Smith 4237170fe5c8SBarry Smith */ 4238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4239d71ae5a4SJacob Faibussowitsch { 4240170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4241170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4242170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 424386214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4244170fe5c8SBarry Smith const PetscInt *ii, *idx; 4245170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4246170fe5c8SBarry Smith PetscScalar *c, *c_q; 424786214ceeSStefano Zampini PetscInt clda = sub_c->lda; 424886214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4249170fe5c8SBarry Smith 4250170fe5c8SBarry Smith PetscFunctionBegin; 4251d0f46423SBarry Smith m = A->rmap->n; 4252d0f46423SBarry Smith n = A->cmap->n; 4253d0f46423SBarry Smith p = B->cmap->n; 4254170fe5c8SBarry Smith a = sub_a->v; 4255170fe5c8SBarry Smith b = sub_b->a; 4256170fe5c8SBarry Smith c = sub_c->v; 425786214ceeSStefano Zampini if (clda == m) { 42589566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 425986214ceeSStefano Zampini } else { 426086214ceeSStefano Zampini for (j = 0; j < p; j++) 42619371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 426286214ceeSStefano Zampini } 4263170fe5c8SBarry Smith ii = sub_b->i; 4264170fe5c8SBarry Smith idx = sub_b->j; 4265170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4266170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4267170fe5c8SBarry Smith while (q-- > 0) { 426886214ceeSStefano Zampini c_q = c + clda * (*idx); 426986214ceeSStefano Zampini a_q = a + alda * i; 4270854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4271170fe5c8SBarry Smith idx++; 4272170fe5c8SBarry Smith b++; 4273170fe5c8SBarry Smith } 4274170fe5c8SBarry Smith } 4275170fe5c8SBarry Smith PetscFunctionReturn(0); 4276170fe5c8SBarry Smith } 4277170fe5c8SBarry Smith 4278d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4279d71ae5a4SJacob Faibussowitsch { 4280d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 428186214ceeSStefano Zampini PetscBool cisdense; 4282170fe5c8SBarry Smith 4283170fe5c8SBarry Smith PetscFunctionBegin; 428408401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42859566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42869566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 42879566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 428848a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42899566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4290d73949e8SHong Zhang 42914222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4292170fe5c8SBarry Smith PetscFunctionReturn(0); 4293170fe5c8SBarry Smith } 4294170fe5c8SBarry Smith 4295170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42960bad9183SKris Buschelman /*MC 4297fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42980bad9183SKris Buschelman based on compressed sparse row format. 42990bad9183SKris Buschelman 43000bad9183SKris Buschelman Options Database Keys: 43010bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43020bad9183SKris Buschelman 43030bad9183SKris Buschelman Level: beginner 43040bad9183SKris Buschelman 43050cd7f59aSBarry Smith Notes: 430611a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 43070cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43080cd7f59aSBarry Smith in the matrix 43090cd7f59aSBarry Smith 431011a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this no 431111a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43120cd7f59aSBarry Smith 431311a5261eSBarry Smith Developer Note: 43140cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 43150cd7f59aSBarry Smith 4316db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43170bad9183SKris Buschelman M*/ 43180bad9183SKris Buschelman 4319ccd284c7SBarry Smith /*MC 4320ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4321ccd284c7SBarry Smith 432211a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 432311a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 432411a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4325ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4326ccd284c7SBarry Smith the above preallocation routines for simplicity. 4327ccd284c7SBarry Smith 4328ccd284c7SBarry Smith Options Database Keys: 432911a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4330ccd284c7SBarry Smith 433111a5261eSBarry Smith Note: 433211a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4333ccd284c7SBarry Smith enough exist. 
4334ccd284c7SBarry Smith 4335ccd284c7SBarry Smith Level: beginner 4336ccd284c7SBarry Smith 4337db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4338ccd284c7SBarry Smith M*/ 4339ccd284c7SBarry Smith 4340ccd284c7SBarry Smith /*MC 4341ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4342ccd284c7SBarry Smith 434311a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 434411a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 434511a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4346ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4347ccd284c7SBarry Smith the above preallocation routines for simplicity. 4348ccd284c7SBarry Smith 4349ccd284c7SBarry Smith Options Database Keys: 435011a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4351ccd284c7SBarry Smith 4352ccd284c7SBarry Smith Level: beginner 4353ccd284c7SBarry Smith 4354c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4355ccd284c7SBarry Smith M*/ 4356ccd284c7SBarry Smith 43577906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43587906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43597906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43607906f579SHong Zhang #endif 4361d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4362d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4363d24d4204SJose E. 
Roman #endif 43647906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43657906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43667906f579SHong Zhang #endif 43677906f579SHong Zhang 4368d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4369c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43704222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43717906f579SHong Zhang 43728c778c55SBarry Smith /*@C 437311a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43748c778c55SBarry Smith 43758c778c55SBarry Smith Not Collective 43768c778c55SBarry Smith 43778c778c55SBarry Smith Input Parameter: 437811a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43798c778c55SBarry Smith 43808c778c55SBarry Smith Output Parameter: 43818c778c55SBarry Smith . 
array - pointer to the data 43828c778c55SBarry Smith 43838c778c55SBarry Smith Level: intermediate 43848c778c55SBarry Smith 4385db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43868c778c55SBarry Smith @*/ 4387d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4388d71ae5a4SJacob Faibussowitsch { 4389d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43908c778c55SBarry Smith 43918c778c55SBarry Smith PetscFunctionBegin; 4392d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43939566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4394d67d9f35SJunchao Zhang } else { 4395d67d9f35SJunchao Zhang *array = aij->a; 4396d67d9f35SJunchao Zhang } 4397d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4398d67d9f35SJunchao Zhang } 4399d67d9f35SJunchao Zhang 4400d67d9f35SJunchao Zhang /*@C 440111a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4402d67d9f35SJunchao Zhang 4403d67d9f35SJunchao Zhang Not Collective 4404d67d9f35SJunchao Zhang 4405d67d9f35SJunchao Zhang Input Parameters: 440611a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4407d67d9f35SJunchao Zhang - array - pointer to the data 4408d67d9f35SJunchao Zhang 4409d67d9f35SJunchao Zhang Level: intermediate 4410d67d9f35SJunchao Zhang 4411db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4412d67d9f35SJunchao Zhang @*/ 4413d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4414d71ae5a4SJacob Faibussowitsch { 4415d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4416d67d9f35SJunchao Zhang 4417d67d9f35SJunchao Zhang PetscFunctionBegin; 4418d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44199566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4420d67d9f35SJunchao Zhang } else { 4421d67d9f35SJunchao 
Zhang *array = NULL; 4422d67d9f35SJunchao Zhang } 44239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44249566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44258c778c55SBarry Smith PetscFunctionReturn(0); 44268c778c55SBarry Smith } 44278c778c55SBarry Smith 442821e72a00SBarry Smith /*@C 442911a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44308f1ea47aSStefano Zampini 44318f1ea47aSStefano Zampini Not Collective 44328f1ea47aSStefano Zampini 44338f1ea47aSStefano Zampini Input Parameter: 443411a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44358f1ea47aSStefano Zampini 44368f1ea47aSStefano Zampini Output Parameter: 44378f1ea47aSStefano Zampini . array - pointer to the data 44388f1ea47aSStefano Zampini 44398f1ea47aSStefano Zampini Level: intermediate 44408f1ea47aSStefano Zampini 4441db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44428f1ea47aSStefano Zampini @*/ 4443d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4444d71ae5a4SJacob Faibussowitsch { 4445d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44468f1ea47aSStefano Zampini 44478f1ea47aSStefano Zampini PetscFunctionBegin; 4448d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44499566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4450d67d9f35SJunchao Zhang } else { 4451d67d9f35SJunchao Zhang *array = aij->a; 4452d67d9f35SJunchao Zhang } 44538f1ea47aSStefano Zampini PetscFunctionReturn(0); 44548f1ea47aSStefano Zampini } 44558f1ea47aSStefano Zampini 44568f1ea47aSStefano Zampini /*@C 445711a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44588f1ea47aSStefano Zampini 44598f1ea47aSStefano Zampini Not Collective 44608f1ea47aSStefano Zampini 44618f1ea47aSStefano Zampini Input 
Parameter: 446211a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44638f1ea47aSStefano Zampini 44648f1ea47aSStefano Zampini Output Parameter: 44658f1ea47aSStefano Zampini . array - pointer to the data 44668f1ea47aSStefano Zampini 44678f1ea47aSStefano Zampini Level: intermediate 44688f1ea47aSStefano Zampini 4469db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44708f1ea47aSStefano Zampini @*/ 4471d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4472d71ae5a4SJacob Faibussowitsch { 4473d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44748f1ea47aSStefano Zampini 44758f1ea47aSStefano Zampini PetscFunctionBegin; 4476d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44779566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4478d67d9f35SJunchao Zhang } else { 4479d67d9f35SJunchao Zhang *array = NULL; 4480d67d9f35SJunchao Zhang } 4481d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4482d67d9f35SJunchao Zhang } 4483d67d9f35SJunchao Zhang 4484d67d9f35SJunchao Zhang /*@C 448511a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4486d67d9f35SJunchao Zhang 4487d67d9f35SJunchao Zhang Not Collective 4488d67d9f35SJunchao Zhang 4489d67d9f35SJunchao Zhang Input Parameter: 449011a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4491d67d9f35SJunchao Zhang 4492d67d9f35SJunchao Zhang Output Parameter: 4493d67d9f35SJunchao Zhang . 
array - pointer to the data 4494d67d9f35SJunchao Zhang 4495d67d9f35SJunchao Zhang Level: intermediate 4496d67d9f35SJunchao Zhang 4497db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4498d67d9f35SJunchao Zhang @*/ 4499d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4500d71ae5a4SJacob Faibussowitsch { 4501d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4502d67d9f35SJunchao Zhang 4503d67d9f35SJunchao Zhang PetscFunctionBegin; 4504d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45059566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4506d67d9f35SJunchao Zhang } else { 4507d67d9f35SJunchao Zhang *array = aij->a; 4508d67d9f35SJunchao Zhang } 45099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45109566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4511d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4512d67d9f35SJunchao Zhang } 4513d67d9f35SJunchao Zhang 4514d67d9f35SJunchao Zhang /*@C 4515d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4516d67d9f35SJunchao Zhang 4517d67d9f35SJunchao Zhang Not Collective 4518d67d9f35SJunchao Zhang 4519d67d9f35SJunchao Zhang Input Parameter: 4520d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4521d67d9f35SJunchao Zhang 4522d67d9f35SJunchao Zhang Output Parameter: 4523d67d9f35SJunchao Zhang . 
array - pointer to the data 4524d67d9f35SJunchao Zhang 4525d67d9f35SJunchao Zhang Level: intermediate 4526d67d9f35SJunchao Zhang 4527db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4528d67d9f35SJunchao Zhang @*/ 4529d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4530d71ae5a4SJacob Faibussowitsch { 4531d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4532d67d9f35SJunchao Zhang 4533d67d9f35SJunchao Zhang PetscFunctionBegin; 4534d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45359566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4536d67d9f35SJunchao Zhang } else { 4537d67d9f35SJunchao Zhang *array = NULL; 4538d67d9f35SJunchao Zhang } 45398f1ea47aSStefano Zampini PetscFunctionReturn(0); 45408f1ea47aSStefano Zampini } 45418f1ea47aSStefano Zampini 45428f1ea47aSStefano Zampini /*@C 454311a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45447ee59b9bSJunchao Zhang 45457ee59b9bSJunchao Zhang Not Collective 45467ee59b9bSJunchao Zhang 45477ee59b9bSJunchao Zhang Input Parameter: 454811a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45497ee59b9bSJunchao Zhang 45507ee59b9bSJunchao Zhang Output Parameters: 45517ee59b9bSJunchao Zhang + i - row map array of the matrix 45527ee59b9bSJunchao Zhang . j - column index array of the matrix 45537ee59b9bSJunchao Zhang . a - data array of the matrix 45547ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45557ee59b9bSJunchao Zhang 45567ee59b9bSJunchao Zhang Notes: 45577ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45587ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45597ee59b9bSJunchao Zhang 45607ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45617ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45627ee59b9bSJunchao Zhang 45637ee59b9bSJunchao Zhang Level: Developer 45647ee59b9bSJunchao Zhang 4565db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45667ee59b9bSJunchao Zhang @*/ 4567d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4568d71ae5a4SJacob Faibussowitsch { 45697ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45707ee59b9bSJunchao Zhang 45717ee59b9bSJunchao Zhang PetscFunctionBegin; 45727ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45737ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45747ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45757ee59b9bSJunchao Zhang } else { 45767ee59b9bSJunchao Zhang if (i) *i = aij->i; 45777ee59b9bSJunchao Zhang if (j) *j = aij->j; 45787ee59b9bSJunchao Zhang if (a) *a = aij->a; 45797ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45807ee59b9bSJunchao Zhang } 45817ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45827ee59b9bSJunchao Zhang } 45837ee59b9bSJunchao Zhang 45847ee59b9bSJunchao Zhang /*@C 458521e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 458621e72a00SBarry Smith 458721e72a00SBarry Smith Not Collective 458821e72a00SBarry Smith 458921e72a00SBarry Smith Input Parameter: 459011a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 459121e72a00SBarry Smith 459221e72a00SBarry Smith Output Parameter: 459321e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 459421e72a00SBarry Smith 459521e72a00SBarry Smith Level: intermediate 459621e72a00SBarry Smith 4597db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 459821e72a00SBarry Smith @*/ 4599d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4600d71ae5a4SJacob Faibussowitsch { 460121e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 460221e72a00SBarry Smith 460321e72a00SBarry Smith PetscFunctionBegin; 460421e72a00SBarry Smith *nz = aij->rmax; 460521e72a00SBarry Smith PetscFunctionReturn(0); 460621e72a00SBarry Smith } 460721e72a00SBarry Smith 4608d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4609d71ae5a4SJacob Faibussowitsch { 4610394ed5ebSJunchao Zhang MPI_Comm comm; 4611394ed5ebSJunchao Zhang PetscInt *i, *j; 4612394ed5ebSJunchao Zhang PetscInt M, N, row; 4613394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4614394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4615394ed5ebSJunchao Zhang PetscInt *Aj; 4616394ed5ebSJunchao Zhang PetscScalar *Aa; 4617cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4618cbc6b225SStefano Zampini MatType rtype; 4619394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4620394ed5ebSJunchao Zhang 4621394ed5ebSJunchao Zhang PetscFunctionBegin; 46229566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46239566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46249566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4625e8729f6fSJunchao Zhang i = coo_i; 4626e8729f6fSJunchao Zhang j = coo_j; 46279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4628394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4629394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4630394ed5ebSJunchao Zhang perm[k] = k; 4631394ed5ebSJunchao Zhang } 4632394ed5ebSJunchao Zhang 4633394ed5ebSJunchao Zhang /* Sort by row */ 46349566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46359371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46369371c9d4SSatish Balay if (i[k] >= 0) break; 46379371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4638394ed5ebSJunchao Zhang nneg = k; 46399566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4640394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 464135cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4642394ed5ebSJunchao Zhang 46439566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4645394ed5ebSJunchao Zhang 4646394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 464735cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4648394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4649394ed5ebSJunchao Zhang while (k < coo_n) { 4650394ed5ebSJunchao Zhang row = i[k]; 4651394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4652394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4653394ed5ebSJunchao Zhang end = k; 46549566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4655394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4656394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4657394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4658394ed5ebSJunchao Zhang Ai[row] = 1; 4659394ed5ebSJunchao Zhang nnz++; 4660394ed5ebSJunchao Zhang 4661394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4662394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4663394ed5ebSJunchao Zhang q++; 4664394ed5ebSJunchao Zhang jmap[q] = 1; 4665394ed5ebSJunchao Zhang Aj[q] = j[p]; 4666394ed5ebSJunchao Zhang Ai[row]++; 4667394ed5ebSJunchao Zhang nnz++; 4668394ed5ebSJunchao Zhang } else { 4669394ed5ebSJunchao Zhang jmap[q]++; 4670394ed5ebSJunchao Zhang } 4671394ed5ebSJunchao Zhang } 4672394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4673394ed5ebSJunchao Zhang } 4674394ed5ebSJunchao Zhang 4675394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4676394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4677394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4678394ed5ebSJunchao Zhang jmap[0] = 0; 4679394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4680394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4681394ed5ebSJunchao Zhang PetscCount *jmap_new; 4682394ed5ebSJunchao Zhang PetscInt *Aj_new; 4683394ed5ebSJunchao Zhang 46849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46859566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46869566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4687394ed5ebSJunchao Zhang jmap = jmap_new; 4688394ed5ebSJunchao Zhang 46899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 46919566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4692394ed5ebSJunchao Zhang Aj = Aj_new; 4693394ed5ebSJunchao Zhang } 4694394ed5ebSJunchao Zhang 
4695394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4696394ed5ebSJunchao Zhang PetscCount *perm_new; 4697cbc6b225SStefano Zampini 46989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 46999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47009566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4701394ed5ebSJunchao Zhang perm = perm_new; 4702394ed5ebSJunchao Zhang } 4703394ed5ebSJunchao Zhang 47049566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47059566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 47069566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4707394ed5ebSJunchao Zhang 4708394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4709394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4710394ed5ebSJunchao Zhang /* Record COO fields */ 4711394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4712394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4713394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4714394ed5ebSJunchao Zhang seqaij->perm = perm; 4715394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4716394ed5ebSJunchao Zhang } 4717394ed5ebSJunchao Zhang 4718d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4719d71ae5a4SJacob Faibussowitsch { 4720394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4721394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4722394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4723394ed5ebSJunchao Zhang PetscScalar *Aa; 
4724394ed5ebSJunchao Zhang 4725394ed5ebSJunchao Zhang PetscFunctionBegin; 47269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4727394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4728b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4729b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4730b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4731394ed5ebSJunchao Zhang } 47329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4733394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4734394ed5ebSJunchao Zhang } 4735394ed5ebSJunchao Zhang 473634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47375063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 473802fe1965SBarry Smith #endif 47393d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47405063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47413d0639e7SStefano Zampini #endif 474202fe1965SBarry Smith 4743d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4744d71ae5a4SJacob Faibussowitsch { 4745273d9f13SBarry Smith Mat_SeqAIJ *b; 474638baddfdSBarry Smith PetscMPIInt size; 4747273d9f13SBarry Smith 4748273d9f13SBarry Smith PetscFunctionBegin; 47499566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 475008401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4751273d9f13SBarry Smith 47524dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47532205254eSKarl Rupp 4754b0a32e0cSBarry Smith B->data = (void *)b; 47552205254eSKarl Rupp 47569566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4757071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47582205254eSKarl Rupp 
/* Conversion routines implemented in other files; only referenced when the corresponding package is configured */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
#endif

/*
  MatCreate_SeqAIJ - constructor that turns the matrix B into a MATSEQAIJ matrix

  It requires a communicator of size at most 1, allocates the Mat_SeqAIJ data structure, installs the
  SeqAIJ operation table, sets the default values of the implementation fields, and composes the
  type-specific functions (conversions, preallocation, products, COO assembly, ...) on the object.
  Finally the inode support is set up and the options database is consulted for a SeqAIJ subtype.
*/
PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
{
  Mat_SeqAIJ *b;
  PetscMPIInt size;

  PetscFunctionBegin;
  PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
  PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");

  PetscCall(PetscNew(&b));

  B->data = (void *)b;

  /* start from the generic SeqAIJ operation table */
  PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps)));
  if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;

  /* default state of the implementation fields */
  b->row                = NULL;
  b->col                = NULL;
  b->icol               = NULL;
  b->reallocs           = 0;
  b->ignorezeroentries  = PETSC_FALSE;
  b->roworiented        = PETSC_TRUE;
  b->nonew              = 0;
  b->diag               = NULL;
  b->solve_work         = NULL;
  B->spptr              = NULL;
  b->saved_values       = NULL;
  b->idiag              = NULL;
  b->mdiag              = NULL;
  b->ssor_work          = NULL;
  b->omega              = 1.0;
  b->fshift             = 0.0;
  b->idiagvalid         = PETSC_FALSE;
  b->ibdiagvalid        = PETSC_FALSE;
  b->keepnonzeropattern = PETSC_FALSE;

  PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
  /* compose the functions that are looked up by name on a MATSEQAIJ object */
#if defined(PETSC_HAVE_MATLAB)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
#if defined(PETSC_HAVE_MKL_SPARSE)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
#endif
#if defined(PETSC_HAVE_CUDA)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
#if defined(PETSC_HAVE_ELEMENTAL)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
#endif
#if defined(PETSC_HAVE_SCALAPACK)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
#endif
#if defined(PETSC_HAVE_HYPRE)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
  /* NOTE(review): the Hermitian-transpose test is composed with the same routine as the transpose test -- confirm this is intended */
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
  PetscCall(MatCreate_SeqAIJ_Inode(B));
  /* NOTE(review): the type name was already set above; presumably repeated in case the inode setup touched it -- confirm */
  PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
  PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
  PetscFunctionReturn(0);
}
PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4844273d9f13SBarry Smith 4845d5f3da31SBarry Smith C->factortype = A->factortype; 4846f4259b30SLisandro Dalcin c->row = NULL; 4847f4259b30SLisandro Dalcin c->col = NULL; 4848f4259b30SLisandro Dalcin c->icol = NULL; 48496ad4291fSHong Zhang c->reallocs = 0; 485017ab2063SBarry Smith 485169272f91SPierre Jolivet C->assembled = A->assembled; 485269272f91SPierre Jolivet C->preallocated = A->preallocated; 485317ab2063SBarry Smith 485469272f91SPierre Jolivet if (A->preallocated) { 48559566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48569566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4857eec197d1SBarry Smith 48589566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48599566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48619566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 486217ab2063SBarry Smith 486317ab2063SBarry Smith /* allocate the matrix space */ 4864f77e22a1SHong Zhang if (mallocmatspace) { 48659566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48662205254eSKarl Rupp 4867f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48682205254eSKarl Rupp 48699566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 487017ab2063SBarry Smith if (m > 0) { 48719566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4872be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48732e5835c6SStefano Zampini const PetscScalar *aa; 48742e5835c6SStefano Zampini 48759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48769566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
4878be6bf707SBarry Smith } else { 48799566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 488017ab2063SBarry Smith } 488108480c60SBarry Smith } 4882f77e22a1SHong Zhang } 488317ab2063SBarry Smith 48846ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4885416022c9SBarry Smith c->roworiented = a->roworiented; 4886416022c9SBarry Smith c->nonew = a->nonew; 4887416022c9SBarry Smith if (a->diag) { 48889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 48899566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4890071fcb05SBarry Smith } else c->diag = NULL; 48912205254eSKarl Rupp 4892f4259b30SLisandro Dalcin c->solve_work = NULL; 4893f4259b30SLisandro Dalcin c->saved_values = NULL; 4894f4259b30SLisandro Dalcin c->idiag = NULL; 4895f4259b30SLisandro Dalcin c->ssor_work = NULL; 4896a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4897e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4898e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 48996ad4291fSHong Zhang 4900893ad86cSHong Zhang c->rmax = a->rmax; 4901416022c9SBarry Smith c->nz = a->nz; 49028ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4903754ec7b1SSatish Balay 49046ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49056ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4906cd6b891eSBarry Smith if (a->compressedrow.use) { 49076ad4291fSHong Zhang i = a->compressedrow.nrows; 49089566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49099566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49109566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 491127ea64f8SHong Zhang } else { 491227ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49130298fd71SBarry Smith c->compressedrow.i = 
NULL; 49140298fd71SBarry Smith c->compressedrow.rindex = NULL; 49156ad4291fSHong Zhang } 4916ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4917e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49184846f1f5SKris Buschelman 49199566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 492069272f91SPierre Jolivet } 49219566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49223a40ed3dSBarry Smith PetscFunctionReturn(0); 492317ab2063SBarry Smith } 492417ab2063SBarry Smith 4925d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4926d71ae5a4SJacob Faibussowitsch { 4927b24902e0SBarry Smith PetscFunctionBegin; 49289566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 493048a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49319566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49329566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4933b24902e0SBarry Smith PetscFunctionReturn(0); 4934b24902e0SBarry Smith } 4935b24902e0SBarry Smith 4936d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4937d71ae5a4SJacob Faibussowitsch { 493852f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 493952f91c60SVaclav Hapla 494052f91c60SVaclav Hapla PetscFunctionBegin; 494152f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 494252f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4943c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49449566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 
49459566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49469566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 494752f91c60SVaclav Hapla if (isbinary) { 49489566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 494952f91c60SVaclav Hapla } else if (ishdf5) { 495052f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49519566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 495252f91c60SVaclav Hapla #else 495352f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 495452f91c60SVaclav Hapla #endif 495552f91c60SVaclav Hapla } else { 495698921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 495752f91c60SVaclav Hapla } 495852f91c60SVaclav Hapla PetscFunctionReturn(0); 495952f91c60SVaclav Hapla } 496052f91c60SVaclav Hapla 4961d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4962d71ae5a4SJacob Faibussowitsch { 49633ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49643ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4965fbdbba38SShri Abhyankar 4966fbdbba38SShri Abhyankar PetscFunctionBegin; 49679566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4968bbead8a2SBarry Smith 49693ea6fe3dSLisandro Dalcin /* read in matrix header */ 49709566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 497108401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49729371c9d4SSatish Balay M = header[1]; 
49739371c9d4SSatish Balay N = header[2]; 49749371c9d4SSatish Balay nz = header[3]; 497508401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 497608401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 497708401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4978fbdbba38SShri Abhyankar 49793ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49809566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49813ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49823ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49833ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49843ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49853ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49879566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49883ea6fe3dSLisandro Dalcin 49893ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49909566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4991aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49923ea6fe3dSLisandro Dalcin 4993fbdbba38SShri Abhyankar /* read in row lengths */ 49949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 49959566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 
49963ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 49979371c9d4SSatish Balay sum = 0; 49989371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 499908401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50003ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50029566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5003aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50043ea6fe3dSLisandro Dalcin /* store row lengths */ 50059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50069566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5007fbdbba38SShri Abhyankar 50083ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50099371c9d4SSatish Balay a->i[0] = 0; 50109371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50113ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50129566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50133ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50149566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5015fbdbba38SShri Abhyankar 50169566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50179566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 5018fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5019fbdbba38SShri Abhyankar } 5020fbdbba38SShri Abhyankar 5021d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5022d71ae5a4SJacob Faibussowitsch { 50237264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5024fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5025eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5026eeffb40dSHong Zhang PetscInt k; 5027eeffb40dSHong Zhang #endif 50287264ac53SSatish Balay 50293a40ed3dSBarry Smith PetscFunctionBegin; 5030bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5031d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5032ca44d042SBarry Smith *flg = PETSC_FALSE; 5033ca44d042SBarry Smith PetscFunctionReturn(0); 5034bcd2baecSBarry Smith } 50357264ac53SSatish Balay 50367264ac53SSatish Balay /* if the a->i are the same */ 50379566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5038abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50397264ac53SSatish Balay 50407264ac53SSatish Balay /* if a->j are the same */ 50419566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5042abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5043bcd2baecSBarry Smith 50449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5046bcd2baecSBarry Smith /* if a->a are the same */ 5047eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5048eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5049fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5050eeffb40dSHong Zhang *flg = PETSC_FALSE; 50513a40ed3dSBarry Smith PetscFunctionReturn(0); 5052eeffb40dSHong Zhang } 5053eeffb40dSHong Zhang } 5054eeffb40dSHong Zhang #else 50559566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5056eeffb40dSHong Zhang #endif 50579566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5059eeffb40dSHong Zhang PetscFunctionReturn(0); 50607264ac53SSatish Balay } 506136db0b34SBarry Smith 506205869f15SSatish Balay /*@ 506311a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 506436db0b34SBarry Smith provided by the user. 506536db0b34SBarry Smith 5066d083f849SBarry Smith Collective 506736db0b34SBarry Smith 506836db0b34SBarry Smith Input Parameters: 506936db0b34SBarry Smith + comm - must be an MPI communicator of size 1 507036db0b34SBarry Smith . m - number of rows 507136db0b34SBarry Smith . n - number of columns 5072483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 507336db0b34SBarry Smith . j - column indices 507436db0b34SBarry Smith - a - matrix values 507536db0b34SBarry Smith 507636db0b34SBarry Smith Output Parameter: 507736db0b34SBarry Smith . mat - the matrix 507836db0b34SBarry Smith 507936db0b34SBarry Smith Level: intermediate 508036db0b34SBarry Smith 508136db0b34SBarry Smith Notes: 50820551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5083292fb18eSBarry Smith once the matrix is destroyed and not before 508436db0b34SBarry Smith 508536db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 508636db0b34SBarry Smith 5087bfeeae90SHong Zhang The i and j indices are 0 based 508836db0b34SBarry Smith 5089a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5090a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50918eef79e4SBarry Smith as shown 5092a4552177SSatish Balay 50938eef79e4SBarry Smith $ 1 0 0 50948eef79e4SBarry Smith $ 2 0 3 50958eef79e4SBarry Smith $ 4 5 6 50968eef79e4SBarry Smith $ 50978eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 50988eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 50998eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5100a4552177SSatish Balay 5101db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 510236db0b34SBarry Smith @*/ 5103d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5104d71ae5a4SJacob Faibussowitsch { 5105cbcfb4deSHong Zhang PetscInt ii; 510636db0b34SBarry Smith Mat_SeqAIJ *aij; 5107cbcfb4deSHong Zhang PetscInt jj; 510836db0b34SBarry Smith 510936db0b34SBarry Smith PetscFunctionBegin; 5110aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51119566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51129566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51139566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51149566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5116ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51179566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5119ab93d7beSBarry Smith 512036db0b34SBarry Smith aij->i = i; 512136db0b34SBarry Smith aij->j = j; 512236db0b34SBarry Smith aij->a = a; 512336db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
512436db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5125e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5126e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 512736db0b34SBarry Smith 5128cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 512936db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 513076bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5131aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51329985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 513308401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 513408401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51359985e31cSBarry Smith } 513636db0b34SBarry Smith } 513776bd3646SJed Brown } 513876bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 513936db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 514008401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5141aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 514236db0b34SBarry Smith } 514376bd3646SJed Brown } 514436db0b34SBarry Smith 51459566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51469566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 514736db0b34SBarry Smith PetscFunctionReturn(0); 514836db0b34SBarry Smith } 5149cbc6b225SStefano Zampini 5150f62e3866SBarry Smith /*@ 515111a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51528a0b0e6bSVictor Minden provided by the user. 51538a0b0e6bSVictor Minden 5154d083f849SBarry Smith Collective 51558a0b0e6bSVictor Minden 51568a0b0e6bSVictor Minden Input Parameters: 51578a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51588a0b0e6bSVictor Minden . m - number of rows 51598a0b0e6bSVictor Minden . n - number of columns 51608a0b0e6bSVictor Minden . i - row indices 51618a0b0e6bSVictor Minden . j - column indices 51621230e6d1SVictor Minden . a - matrix values 51631230e6d1SVictor Minden . nz - number of nonzeros 516411a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51658a0b0e6bSVictor Minden 51668a0b0e6bSVictor Minden Output Parameter: 51678a0b0e6bSVictor Minden . 
mat - the matrix 51688a0b0e6bSVictor Minden 51698a0b0e6bSVictor Minden Level: intermediate 51708a0b0e6bSVictor Minden 5171f62e3866SBarry Smith Example: 5172f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51739e99939fSJunchao Zhang .vb 51748a0b0e6bSVictor Minden 1 0 0 51758a0b0e6bSVictor Minden 2 0 3 51768a0b0e6bSVictor Minden 4 5 6 51778a0b0e6bSVictor Minden 51788a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51798a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51808a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51819e99939fSJunchao Zhang .ve 5182d7547e51SJunchao Zhang Notes: 5183d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5184d7547e51SJunchao Zhang and are particularly useful in iterative applications. 51858a0b0e6bSVictor Minden 5186d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 51878a0b0e6bSVictor Minden @*/ 5188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5189d71ae5a4SJacob Faibussowitsch { 5190d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 51918a0b0e6bSVictor Minden 51928a0b0e6bSVictor Minden PetscFunctionBegin; 51939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5194ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 51959566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51969566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51979566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 51991230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 52001230e6d1SVictor Minden if (idx) { 52011230e6d1SVictor Minden row = i[ii] - 1; 52021230e6d1SVictor Minden col = j[ii] - 1; 52031230e6d1SVictor Minden } else { 52041230e6d1SVictor Minden row = i[ii]; 52051230e6d1SVictor Minden col = j[ii]; 52068a0b0e6bSVictor Minden } 52079566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52088a0b0e6bSVictor Minden } 52099566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52109566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52119566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52128a0b0e6bSVictor Minden PetscFunctionReturn(0); 52138a0b0e6bSVictor Minden } 521436db0b34SBarry Smith 5215d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5216d71ae5a4SJacob Faibussowitsch { 5217acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5218acf2f550SJed Brown 5219acf2f550SJed Brown PetscFunctionBegin; 5220acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5221acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52222205254eSKarl Rupp 52239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5224acf2f550SJed Brown PetscFunctionReturn(0); 5225acf2f550SJed Brown } 5226acf2f550SJed Brown 5227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5228d71ae5a4SJacob Faibussowitsch { 52299c8f2541SHong Zhang PetscFunctionBegin; 52309566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52319c8f2541SHong Zhang PetscFunctionReturn(0); 52329c8f2541SHong Zhang } 52339c8f2541SHong Zhang 523481824310SBarry Smith /* 523553dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
523653dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 523753dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 523853dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 523953dd7562SDmitry Karpeev */ 5240d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5241d71ae5a4SJacob Faibussowitsch { 524253dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 524353dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 524453dd7562SDmitry Karpeev PetscBool seqaij; 524553dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 524653dd7562SDmitry Karpeev PetscScalar v; 524753dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 524853dd7562SDmitry Karpeev 524953dd7562SDmitry Karpeev PetscFunctionBegin; 525053dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 525153dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52529566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 525328b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 525453dd7562SDmitry Karpeev if (rowemb) { 52559566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 525608401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 525753dd7562SDmitry Karpeev } else { 525808401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 525953dd7562SDmitry Karpeev } 526053dd7562SDmitry Karpeev if (colemb) { 52619566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 526208401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 526353dd7562SDmitry Karpeev } else { 526408401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 526553dd7562SDmitry Karpeev } 526653dd7562SDmitry Karpeev 526753dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 526853dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5270ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52729566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 527353dd7562SDmitry Karpeev } 527448a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 527553dd7562SDmitry Karpeev count = 0; 527653dd7562SDmitry Karpeev rowindices = NULL; 
527753dd7562SDmitry Karpeev colindices = NULL; 527848a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 527948a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 528053dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 528153dd7562SDmitry Karpeev PetscInt row; 528253dd7562SDmitry Karpeev row = i; 528353dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 528453dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 528553dd7562SDmitry Karpeev PetscInt col; 528653dd7562SDmitry Karpeev col = Baij->j[count]; 528753dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 528853dd7562SDmitry Karpeev v = Baij->a[count]; 52899566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 529053dd7562SDmitry Karpeev ++count; 529153dd7562SDmitry Karpeev } 529253dd7562SDmitry Karpeev } 529353dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 529453dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 529553dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 529653dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 529753dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 529853dd7562SDmitry Karpeev PetscFunctionReturn(0); 529953dd7562SDmitry Karpeev } 530053dd7562SDmitry Karpeev 53014099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53024099cc6bSBarry Smith 53034099cc6bSBarry Smith /*@C 530411a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53054099cc6bSBarry Smith 5306c3339decSBarry Smith Collective 53074099cc6bSBarry Smith 53084099cc6bSBarry Smith Input Parameters: 53094099cc6bSBarry Smith + mat - the matrix object 53104099cc6bSBarry Smith - matype - matrix type 53114099cc6bSBarry Smith 53124099cc6bSBarry Smith Options Database Key: 53134099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 53144099cc6bSBarry Smith 53154099cc6bSBarry Smith Level: intermediate 53164099cc6bSBarry Smith 5317db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53184099cc6bSBarry Smith @*/ 5319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5320d71ae5a4SJacob Faibussowitsch { 53214099cc6bSBarry Smith PetscBool sametype; 53225f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53234099cc6bSBarry Smith 53244099cc6bSBarry Smith PetscFunctionBegin; 53254099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53269566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53274099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53284099cc6bSBarry Smith 53299566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53305f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53319566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53324099cc6bSBarry Smith PetscFunctionReturn(0); 53334099cc6bSBarry Smith } 53344099cc6bSBarry Smith 53354099cc6bSBarry Smith /*@C 533611a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53374099cc6bSBarry Smith 53384099cc6bSBarry Smith Not Collective 53394099cc6bSBarry Smith 53404099cc6bSBarry Smith Input Parameters: 534111a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 53424099cc6bSBarry Smith - function - routine to convert to subtype 53434099cc6bSBarry Smith 53444099cc6bSBarry Smith Notes: 534511a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
53464099cc6bSBarry Smith 53474099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53484099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53494099cc6bSBarry Smith 53504099cc6bSBarry Smith Level: advanced 53514099cc6bSBarry Smith 5352db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53534099cc6bSBarry Smith @*/ 5354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5355d71ae5a4SJacob Faibussowitsch { 53564099cc6bSBarry Smith PetscFunctionBegin; 53579566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53589566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 53594099cc6bSBarry Smith PetscFunctionReturn(0); 53604099cc6bSBarry Smith } 53614099cc6bSBarry Smith 53624099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53634099cc6bSBarry Smith 53644099cc6bSBarry Smith /*@C 536511a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 53664099cc6bSBarry Smith 53674099cc6bSBarry Smith Not Collective 53684099cc6bSBarry Smith 53694099cc6bSBarry Smith Level: advanced 53704099cc6bSBarry Smith 5371db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53724099cc6bSBarry Smith @*/ 5373d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5374d71ae5a4SJacob Faibussowitsch { 53754099cc6bSBarry Smith PetscFunctionBegin; 53764099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53774099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53784099cc6bSBarry Smith 53799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 53829779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 53839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5384485f9817SRichard Tran Mills #endif 53855063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 53869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 53875063d097SStefano Zampini #endif 53885063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 53899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 53905063d097SStefano Zampini #endif 53914099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 53929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 53934099cc6bSBarry Smith #endif 53944099cc6bSBarry Smith PetscFunctionReturn(0); 53954099cc6bSBarry Smith } 539653dd7562SDmitry Karpeev 539753dd7562SDmitry Karpeev /* 539881824310SBarry Smith Special version for direct calls from Fortran 539981824310SBarry Smith */ 5400af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 540181824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 540281824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 540381824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 540481824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 540581824310SBarry Smith #endif 540681824310SBarry Smith 540781824310SBarry Smith /* Change these macros so can be used in void function */ 540898921bdaSJacob Faibussowitsch 540998921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54109566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54119566063dSJacob Faibussowitsch #undef PetscCall 54129371c9d4SSatish Balay #define PetscCall(...) 
\ 54139371c9d4SSatish Balay do { \ 54145f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 541598921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 541698921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 541798921bdaSJacob Faibussowitsch return; \ 541898921bdaSJacob Faibussowitsch } \ 541998921bdaSJacob Faibussowitsch } while (0) 542098921bdaSJacob Faibussowitsch 542198921bdaSJacob Faibussowitsch #undef SETERRQ 54229371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54239371c9d4SSatish Balay do { \ 542498921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 542598921bdaSJacob Faibussowitsch return; \ 542698921bdaSJacob Faibussowitsch } while (0) 542781824310SBarry Smith 5428d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5429d71ae5a4SJacob Faibussowitsch { 543081824310SBarry Smith Mat A = *AA; 543181824310SBarry Smith PetscInt m = *mm, n = *nn; 543281824310SBarry Smith InsertMode is = *isis; 543381824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 543481824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 543581824310SBarry Smith PetscInt *imax, *ai, *ailen; 543681824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 543754f21887SBarry Smith MatScalar *ap, value, *aa; 5438ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5439ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 544081824310SBarry Smith 544181824310SBarry Smith PetscFunctionBegin; 54424994cf47SJed Brown MatCheckPreallocated(A, 1); 544381824310SBarry Smith imax = a->imax; 544481824310SBarry Smith ai = a->i; 544581824310SBarry Smith 
ailen = a->ilen; 544681824310SBarry Smith aj = a->j; 544781824310SBarry Smith aa = a->a; 544881824310SBarry Smith 544981824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 545081824310SBarry Smith row = im[k]; 545181824310SBarry Smith if (row < 0) continue; 54525f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 54539371c9d4SSatish Balay rp = aj + ai[row]; 54549371c9d4SSatish Balay ap = aa + ai[row]; 54559371c9d4SSatish Balay rmax = imax[row]; 54569371c9d4SSatish Balay nrow = ailen[row]; 545781824310SBarry Smith low = 0; 545881824310SBarry Smith high = nrow; 545981824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 546081824310SBarry Smith if (in[l] < 0) continue; 54615f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 546281824310SBarry Smith col = in[l]; 54632205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 54642205254eSKarl Rupp else value = v[k + l * m]; 54652205254eSKarl Rupp 546681824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 546781824310SBarry Smith 54682205254eSKarl Rupp if (col <= lastcol) low = 0; 54692205254eSKarl Rupp else high = nrow; 547081824310SBarry Smith lastcol = col; 547181824310SBarry Smith while (high - low > 5) { 547281824310SBarry Smith t = (low + high) / 2; 547381824310SBarry Smith if (rp[t] > col) high = t; 547481824310SBarry Smith else low = t; 547581824310SBarry Smith } 547681824310SBarry Smith for (i = low; i < high; i++) { 547781824310SBarry Smith if (rp[i] > col) break; 547881824310SBarry Smith if (rp[i] == col) { 547981824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 548081824310SBarry Smith else ap[i] = value; 548181824310SBarry Smith goto noinsert; 548281824310SBarry Smith } 548381824310SBarry Smith } 548481824310SBarry Smith if (value == 0.0 && 
ignorezeroentries) goto noinsert; 548581824310SBarry Smith if (nonew == 1) goto noinsert; 54865f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5487fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 54889371c9d4SSatish Balay N = nrow++ - 1; 54899371c9d4SSatish Balay a->nz++; 54909371c9d4SSatish Balay high++; 549181824310SBarry Smith /* shift up all the later entries in this row */ 549281824310SBarry Smith for (ii = N; ii >= i; ii--) { 549381824310SBarry Smith rp[ii + 1] = rp[ii]; 549481824310SBarry Smith ap[ii + 1] = ap[ii]; 549581824310SBarry Smith } 549681824310SBarry Smith rp[i] = col; 549781824310SBarry Smith ap[i] = value; 5498e56f5c9eSBarry Smith A->nonzerostate++; 549981824310SBarry Smith noinsert:; 550081824310SBarry Smith low = i + 1; 550181824310SBarry Smith } 550281824310SBarry Smith ailen[row] = nrow; 550381824310SBarry Smith } 550481824310SBarry Smith PetscFunctionReturnVoid(); 550581824310SBarry Smith } 550698921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 550798921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 550898921bdaSJacob Faibussowitsch * original definitions */ 55099566063dSJacob Faibussowitsch #undef PetscCall 551098921bdaSJacob Faibussowitsch #undef SETERRQ 5511