1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 597fff043a9SJunchao Zhang MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 6009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 6369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, 
rowlens, m, PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 11237b083b7cSBarry Smith 112417ab2063SBarry Smith /* reset ilen and imax for each row */ 11257b083b7cSBarry Smith a->nonzerorowcnt = 0; 1126396832f4SHong Zhang if (A->structure_only) { 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1129396832f4SHong Zhang } else { /* !A->structure_only */ 113017ab2063SBarry Smith for (i = 0; i < m; i++) { 113117ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11327b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113317ab2063SBarry Smith } 1134396832f4SHong Zhang } 1135bfeeae90SHong Zhang a->nz = ai[m]; 1136aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, 
PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113717ab2063SBarry Smith 11389566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11419566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11422205254eSKarl Rupp 11438e58a170SBarry Smith A->info.mallocs += a->reallocs; 1144dd5f02e7SSatish Balay a->reallocs = 0; 11456712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114636db0b34SBarry Smith a->rmax = rmax; 11474e220ebcSLois Curfman McInnes 114848a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11503a40ed3dSBarry Smith PetscFunctionReturn(0); 115117ab2063SBarry Smith } 115217ab2063SBarry Smith 1153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1154d71ae5a4SJacob Faibussowitsch { 115599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115699cafbc1SBarry Smith PetscInt i, nz = a->nz; 11572e5835c6SStefano Zampini MatScalar *aa; 115899cafbc1SBarry Smith 115999cafbc1SBarry Smith PetscFunctionBegin; 11609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116199cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116499cafbc1SBarry Smith PetscFunctionReturn(0); 
116599cafbc1SBarry Smith } 116699cafbc1SBarry Smith 1167d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1168d71ae5a4SJacob Faibussowitsch { 116999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117099cafbc1SBarry Smith PetscInt i, nz = a->nz; 11712e5835c6SStefano Zampini MatScalar *aa; 117299cafbc1SBarry Smith 117399cafbc1SBarry Smith PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117899cafbc1SBarry Smith PetscFunctionReturn(0); 117999cafbc1SBarry Smith } 118099cafbc1SBarry Smith 1181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1182d71ae5a4SJacob Faibussowitsch { 1183fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1184fff043a9SJunchao Zhang MatScalar *aa; 11853a40ed3dSBarry Smith 11863a40ed3dSBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11889566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913a40ed3dSBarry Smith PetscFunctionReturn(0); 119217ab2063SBarry Smith } 1193416022c9SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197cbc6b225SStefano Zampini 1198cbc6b225SStefano Zampini PetscFunctionBegin; 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1201cbc6b225SStefano Zampini PetscFunctionReturn(0); 
1202cbc6b225SStefano Zampini } 1203cbc6b225SStefano Zampini 1204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1205d71ae5a4SJacob Faibussowitsch { 1206416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1207d5d45c9bSBarry Smith 12083a40ed3dSBarry Smith PetscFunctionBegin; 1209aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1210c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121117ab2063SBarry Smith #endif 12129566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12139566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12159566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12269566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1228901853e0SKris Buschelman 12296718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12306718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12316718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12326718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12336718818eSStefano Zampini due to different matrix sizes */ 12349566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12356718818eSStefano Zampini 12369566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12382e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12472e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12482e956fe4SStefano Zampini #endif 12494222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12534222ddf1SHong Zhang #endif 12543d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12563d0639e7SStefano Zampini #endif 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1258af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1260af8000cdSHong Zhang #endif 1261d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1263d24d4204SJose E. 
Roman #endif 126463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 126763c07aadSStefano Zampini #endif 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12722e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12832e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12842e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12892e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12903a40ed3dSBarry Smith PetscFunctionReturn(0); 129117ab2063SBarry Smith } 129217ab2063SBarry Smith 1293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1294d71ae5a4SJacob Faibussowitsch { 1295416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 12963a40ed3dSBarry Smith 12973a40ed3dSBarry Smith PetscFunctionBegin; 1298a65d3064SKris Buschelman switch (op) { 1299d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1300d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1301d71ae5a4SJacob Faibussowitsch break; 1302d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1303d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1304d71ae5a4SJacob Faibussowitsch break; 1305d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1306d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1307d71ae5a4SJacob Faibussowitsch break; 1308d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1309d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1310d71ae5a4SJacob Faibussowitsch break; 1311d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1312d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1315d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1318d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1319d71ae5a4SJacob Faibussowitsch break; 13203d472b54SHong Zhang case MAT_SPD: 1321b1646e73SJed Brown case MAT_SYMMETRIC: 1322b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1323b1646e73SJed Brown case MAT_HERMITIAN: 1324b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1325957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1326b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1327b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1328b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13295021d80fSJed Brown break; 13308c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1331a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1332d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1333d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1334d71ae5a4SJacob Faibussowitsch break; 1335d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1336d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1337d71ae5a4SJacob Faibussowitsch break; 1338d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1339d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1340d71ae5a4SJacob Faibussowitsch break; 1341071fcb05SBarry Smith case MAT_SORTED_FULL: 
1342071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1343071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1344071fcb05SBarry Smith break; 1345d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1346d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1347d71ae5a4SJacob Faibussowitsch break; 1348d71ae5a4SJacob Faibussowitsch default: 1349d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1350a65d3064SKris Buschelman } 13513a40ed3dSBarry Smith PetscFunctionReturn(0); 135217ab2063SBarry Smith } 135317ab2063SBarry Smith 1354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1355d71ae5a4SJacob Faibussowitsch { 1356416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1357fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1358c898d852SStefano Zampini PetscScalar *x; 1359c898d852SStefano Zampini const PetscScalar *aa; 136017ab2063SBarry Smith 13613a40ed3dSBarry Smith PetscFunctionBegin; 13629566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1365d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1366d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13679566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13682c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137135e7444dSHong Zhang PetscFunctionReturn(0); 137235e7444dSHong Zhang } 137335e7444dSHong Zhang 13749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137535e7444dSHong Zhang for (i = 0; i < n; i++) { 
1376fdc842d1SBarry Smith x[i] = 0.0; 137735e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 137835e7444dSHong Zhang if (aj[j] == i) { 137935e7444dSHong Zhang x[i] = aa[j]; 138017ab2063SBarry Smith break; 138117ab2063SBarry Smith } 138217ab2063SBarry Smith } 138317ab2063SBarry Smith } 13849566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13863a40ed3dSBarry Smith PetscFunctionReturn(0); 138717ab2063SBarry Smith } 138817ab2063SBarry Smith 1389c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1390d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1391d71ae5a4SJacob Faibussowitsch { 1392416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13935f22a7b3SSebastian Grimberg const MatScalar *aa; 1394d9ca1df4SBarry Smith PetscScalar *y; 1395d9ca1df4SBarry Smith const PetscScalar *x; 1396d0f46423SBarry Smith PetscInt m = A->rmap->n; 13975c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 13985f22a7b3SSebastian Grimberg const MatScalar *v; 1399a77337e4SBarry Smith PetscScalar alpha; 1400d9ca1df4SBarry Smith PetscInt n, i, j; 1401d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14023447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1403ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14045c897100SBarry Smith #endif 140517ab2063SBarry Smith 14063a40ed3dSBarry Smith PetscFunctionBegin; 14079566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14099566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14115c897100SBarry Smith 14125c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1413fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14145c897100SBarry Smith #else 14153447b6efSHong Zhang if (usecprow) { 14163447b6efSHong Zhang m = cprow.nrows; 14173447b6efSHong Zhang ii = cprow.i; 14187b2bb3b9SHong Zhang ridx = cprow.rindex; 14193447b6efSHong Zhang } else { 14203447b6efSHong Zhang ii = a->i; 14213447b6efSHong Zhang } 142217ab2063SBarry Smith for (i = 0; i < m; i++) { 14233447b6efSHong Zhang idx = a->j + ii[i]; 1424fff043a9SJunchao Zhang v = aa + ii[i]; 14253447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14263447b6efSHong Zhang if (usecprow) { 14277b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14283447b6efSHong Zhang } else { 142917ab2063SBarry Smith alpha = x[i]; 14303447b6efSHong Zhang } 143104fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143217ab2063SBarry Smith } 14335c897100SBarry Smith #endif 14349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14359566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14369566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14383a40ed3dSBarry Smith PetscFunctionReturn(0); 143917ab2063SBarry Smith } 144017ab2063SBarry Smith 1441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1442d71ae5a4SJacob Faibussowitsch { 14435c897100SBarry Smith PetscFunctionBegin; 14449566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14459566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14465c897100SBarry Smith PetscFunctionReturn(0); 14475c897100SBarry Smith } 14485c897100SBarry Smith 1449c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145078b84d54SShri Abhyankar 1451d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1452d71ae5a4SJacob Faibussowitsch { 1453416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1454d9fead3dSBarry Smith PetscScalar *y; 145554f21887SBarry Smith const 
PetscScalar *x; 1456fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1457003131ecSBarry Smith PetscInt m = A->rmap->n; 14580298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14597b083b7cSBarry Smith PetscInt n, i; 1460362ced78SSatish Balay PetscScalar sum; 1461ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146217ab2063SBarry Smith 1463b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146497952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1465fee21e36SBarry Smith #endif 1466fee21e36SBarry Smith 14673a40ed3dSBarry Smith PetscFunctionBegin; 1468b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14699566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1470b215bc84SStefano Zampini PetscFunctionReturn(0); 1471b215bc84SStefano Zampini } 14729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14739566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14749566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1475416022c9SBarry Smith ii = a->i; 14764eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 147897952fefSHong Zhang m = a->compressedrow.nrows; 147997952fefSHong Zhang ii = a->compressedrow.i; 148097952fefSHong Zhang ridx = a->compressedrow.rindex; 148197952fefSHong Zhang for (i = 0; i < m; i++) { 148297952fefSHong Zhang n = ii[i + 1] - ii[i]; 148397952fefSHong Zhang aj = a->j + ii[i]; 1484fff043a9SJunchao Zhang aa = a_a + ii[i]; 148597952fefSHong Zhang sum = 0.0; 1486003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1487003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 148897952fefSHong Zhang y[*ridx++] = sum; 148997952fefSHong Zhang } 149097952fefSHong Zhang } else { /* do not use compressed row format */ 1491b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14923d3eaba7SBarry Smith aj = a->j; 1493fff043a9SJunchao Zhang aa 
= a_a; 1494b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1495b05257ddSBarry Smith #else 149617ab2063SBarry Smith for (i = 0; i < m; i++) { 1497003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1498003131ecSBarry Smith aj = a->j + ii[i]; 1499fff043a9SJunchao Zhang aa = a_a + ii[i]; 150017ab2063SBarry Smith sum = 0.0; 1501003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150217ab2063SBarry Smith y[i] = sum; 150317ab2063SBarry Smith } 15048d195f9aSBarry Smith #endif 1505b05257ddSBarry Smith } 15069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15089566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15103a40ed3dSBarry Smith PetscFunctionReturn(0); 151117ab2063SBarry Smith } 151217ab2063SBarry Smith 1513d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1514d71ae5a4SJacob Faibussowitsch { 1515b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1516b434eb95SMatthew G. Knepley PetscScalar *y; 1517b434eb95SMatthew G. Knepley const PetscScalar *x; 1518fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1519b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1520b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1521b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1522b434eb95SMatthew G. Knepley PetscScalar sum; 1523b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1524b434eb95SMatthew G. Knepley 1525b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1526b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1527b434eb95SMatthew G. Knepley #endif 1528b434eb95SMatthew G. Knepley 1529b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15319566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15329566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1533b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1534b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1535b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1536b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1537b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1538b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1539b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1540fff043a9SJunchao Zhang aa = a_a + ii[i]; 1541b434eb95SMatthew G. Knepley sum = 0.0; 1542b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1543b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1544b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1545b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1546b434eb95SMatthew G. Knepley } 1547b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15483d3eaba7SBarry Smith ii = a->i; 1549b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1550b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1551b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1552fff043a9SJunchao Zhang aa = a_a + ii[i]; 1553b434eb95SMatthew G. Knepley sum = 0.0; 1554b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1555b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1556b434eb95SMatthew G. Knepley y[i] = sum; 1557b434eb95SMatthew G. Knepley } 1558b434eb95SMatthew G. Knepley } 15599566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15619566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1563b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1564b434eb95SMatthew G. Knepley } 1565b434eb95SMatthew G. Knepley 1566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1567d71ae5a4SJacob Faibussowitsch { 1568b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1569b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1570b434eb95SMatthew G. Knepley const PetscScalar *x; 1571fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1572b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1573b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1574b434eb95SMatthew G. Knepley PetscScalar sum; 1575b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1576b434eb95SMatthew G. Knepley 1577b434eb95SMatthew G. Knepley PetscFunctionBegin; 15789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15809566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1581b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1583b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1584b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1585b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1586b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1587b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1588b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1589fff043a9SJunchao Zhang aa = a_a + ii[i]; 1590b434eb95SMatthew G. Knepley sum = y[*ridx]; 1591b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1592b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1593b434eb95SMatthew G. Knepley } 1594b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15953d3eaba7SBarry Smith ii = a->i; 1596b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1597b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1598b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1599fff043a9SJunchao Zhang aa = a_a + ii[i]; 1600b434eb95SMatthew G. Knepley sum = y[i]; 1601b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1602b434eb95SMatthew G. Knepley z[i] = sum; 1603b434eb95SMatthew G. Knepley } 1604b434eb95SMatthew G. Knepley } 16059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1609b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1610b434eb95SMatthew G. Knepley } 1611b434eb95SMatthew G. Knepley 1612c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1613d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1614d71ae5a4SJacob Faibussowitsch { 1615416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1616f15663dcSBarry Smith PetscScalar *y, *z; 1617f15663dcSBarry Smith const PetscScalar *x; 1618fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1619d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1620d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1621362ced78SSatish Balay PetscScalar sum; 1622ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16239ea0dfa2SSatish Balay 16243a40ed3dSBarry Smith PetscFunctionBegin; 1625b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16269566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1627b215bc84SStefano Zampini PetscFunctionReturn(0); 1628b215bc84SStefano Zampini } 16299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16319566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16324eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163348a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163497952fefSHong Zhang m = a->compressedrow.nrows; 163597952fefSHong Zhang ii = a->compressedrow.i; 163697952fefSHong Zhang ridx = a->compressedrow.rindex; 163797952fefSHong Zhang for (i = 0; i < m; i++) { 163897952fefSHong Zhang n = ii[i + 1] - ii[i]; 163997952fefSHong Zhang aj = a->j + ii[i]; 1640fff043a9SJunchao Zhang aa = a_a + ii[i]; 164197952fefSHong Zhang sum = y[*ridx]; 1642f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164397952fefSHong Zhang z[*ridx++] = sum; 164497952fefSHong Zhang } 164597952fefSHong Zhang } else { /* do not use compressed row format */ 16463d3eaba7SBarry Smith ii = a->i; 1647f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16483d3eaba7SBarry Smith aj = a->j; 1649fff043a9SJunchao Zhang aa = a_a; 1650f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1651f15663dcSBarry Smith #else 165217ab2063SBarry Smith for (i = 0; i < m; i++) { 1653f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1654f15663dcSBarry Smith aj = a->j + ii[i]; 1655fff043a9SJunchao Zhang aa = a_a + ii[i]; 165617ab2063SBarry Smith sum = y[i]; 1657f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165817ab2063SBarry Smith z[i] = sum; 165917ab2063SBarry Smith } 166002ab625aSSatish Balay #endif 1661f15663dcSBarry Smith } 16629566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16663a40ed3dSBarry Smith PetscFunctionReturn(0); 166717ab2063SBarry Smith } 166817ab2063SBarry Smith 166917ab2063SBarry Smith /* 167017ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167117ab2063SBarry Smith */ 1672d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1673d71ae5a4SJacob Faibussowitsch { 1674416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1675d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1676c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 167717ab2063SBarry Smith 16783a40ed3dSBarry Smith PetscFunctionBegin; 167909f38230SBarry Smith if (!a->diag) { 16809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1681c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168209f38230SBarry Smith } 1683d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1684c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1685c0c07093SJunchao Zhang if (alreadySet) { 1686c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1687c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1688c0c07093SJunchao Zhang } 1689c0c07093SJunchao Zhang 169009f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1691bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1692bfeeae90SHong Zhang if (a->j[j] == i) { 169309f38230SBarry Smith a->diag[i] = j; 169417ab2063SBarry Smith break; 169517ab2063SBarry Smith } 169617ab2063SBarry Smith } 169717ab2063SBarry Smith } 16983a40ed3dSBarry Smith PetscFunctionReturn(0); 169917ab2063SBarry Smith } 170017ab2063SBarry Smith 1701d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1702d71ae5a4SJacob Faibussowitsch { 170361ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170461ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170561ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 170661ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 170761ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 170861ecd0c6SBarry Smith 170961ecd0c6SBarry Smith PetscFunctionBegin; 
171061ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17129566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171361ecd0c6SBarry Smith PetscFunctionReturn(0); 171461ecd0c6SBarry Smith } 171561ecd0c6SBarry Smith 171661ecd0c6SBarry Smith if (a->diagonaldense) { 171761ecd0c6SBarry Smith cnt = 0; 171861ecd0c6SBarry Smith } else { 17199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1721349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172261ecd0c6SBarry Smith cnt++; 172361ecd0c6SBarry Smith mdiag[i] = 1; 172461ecd0c6SBarry Smith } 172561ecd0c6SBarry Smith } 172661ecd0c6SBarry Smith } 172761ecd0c6SBarry Smith if (!cnt) { 17289566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 172961ecd0c6SBarry Smith } else { 1730b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1731b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173261ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173361ecd0c6SBarry Smith 173461ecd0c6SBarry Smith a->a = NULL; 173561ecd0c6SBarry Smith a->j = NULL; 173661ecd0c6SBarry Smith a->i = NULL; 173761ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1738ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 174061ecd0c6SBarry Smith 174161ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174261ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17439566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174448a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1745447d62f5SStefano Zampini } 17469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 174861ecd0c6SBarry Smith if (singlemalloc) { 17499566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 175061ecd0c6SBarry Smith } else { 17519566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17529566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17539566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175461ecd0c6SBarry Smith } 175561ecd0c6SBarry Smith } 17569566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 175761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 175861ecd0c6SBarry Smith PetscFunctionReturn(0); 175961ecd0c6SBarry Smith } 176061ecd0c6SBarry Smith 1761be5855fcSBarry Smith /* 1762be5855fcSBarry Smith Checks for missing diagonals 1763be5855fcSBarry Smith */ 1764d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1765d71ae5a4SJacob Faibussowitsch { 1766be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17677734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1768be5855fcSBarry Smith 1769be5855fcSBarry Smith PetscFunctionBegin; 177009f38230SBarry Smith *missing = PETSC_FALSE; 17717734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177209f38230SBarry Smith *missing = PETSC_TRUE; 177309f38230SBarry Smith if (d) *d = 0; 17749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177509f38230SBarry Smith } else { 177601445905SHong Zhang PetscInt n; 177701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1778f1e2ffcdSBarry Smith diag = a->diag; 177901445905SHong Zhang for (i = 0; i < n; i++) { 17807734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178109f38230SBarry Smith *missing = PETSC_TRUE; 178209f38230SBarry Smith if (d) *d = i; 17839566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1784358d2f5dSShri Abhyankar break; 178509f38230SBarry Smith } 1786be5855fcSBarry Smith } 1787be5855fcSBarry Smith } 1788be5855fcSBarry Smith PetscFunctionReturn(0); 1789be5855fcSBarry Smith } 1790be5855fcSBarry Smith 17910da83c2eSBarry Smith #include <petscblaslapack.h> 17920da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17930da83c2eSBarry Smith 17940da83c2eSBarry Smith /* 17950da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17960da83c2eSBarry Smith */ 1797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1798d71ae5a4SJacob Faibussowitsch { 17990da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18000da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18010da83c2eSBarry Smith const PetscReal shift = 0.0; 18020da83c2eSBarry Smith PetscInt ipvt[5]; 18030da83c2eSBarry Smith PetscScalar work[25], *v_work; 18040da83c2eSBarry Smith 18050da83c2eSBarry Smith PetscFunctionBegin; 18060da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18070da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += 
bsizes[i]; 180808401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1809ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181148a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18120da83c2eSBarry Smith ncnt = 0; 18130da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18140da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18160da83c2eSBarry Smith switch (bsizes[i]) { 1817d71ae5a4SJacob Faibussowitsch case 1: 1818d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1819d71ae5a4SJacob Faibussowitsch break; 18200da83c2eSBarry Smith case 2: 18219566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18220da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18239566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18240da83c2eSBarry Smith break; 18250da83c2eSBarry Smith case 3: 18269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18270da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18289566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18290da83c2eSBarry Smith break; 18300da83c2eSBarry Smith case 4: 18319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18320da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18339566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18340da83c2eSBarry Smith break; 18350da83c2eSBarry Smith case 5: 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18370da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18389566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18390da83c2eSBarry Smith break; 18400da83c2eSBarry Smith case 6: 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18420da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18440da83c2eSBarry Smith break; 18450da83c2eSBarry Smith case 7: 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18470da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18490da83c2eSBarry Smith break; 18500da83c2eSBarry Smith default: 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18520da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18540da83c2eSBarry Smith } 18550da83c2eSBarry Smith ncnt += bsizes[i]; 18560da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18570da83c2eSBarry Smith } 185848a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18599566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18600da83c2eSBarry Smith PetscFunctionReturn(0); 18610da83c2eSBarry Smith } 18620da83c2eSBarry Smith 
1863422a814eSBarry Smith /* 1864422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1865422a814eSBarry Smith */ 1866d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1867d71ae5a4SJacob Faibussowitsch { 186871f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1869d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18702e5835c6SStefano Zampini const MatScalar *v; 187154f21887SBarry Smith PetscScalar *idiag, *mdiag; 187271f1c65dSBarry Smith 187371f1c65dSBarry Smith PetscFunctionBegin; 187471f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18759566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 187671f1c65dSBarry Smith diag = a->diag; 18774dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18782e5835c6SStefano Zampini 187971f1c65dSBarry Smith mdiag = a->mdiag; 188071f1c65dSBarry Smith idiag = a->idiag; 18819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1882422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 188371f1c65dSBarry Smith for (i = 0; i < m; i++) { 188471f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1885899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1886899639b0SHong Zhang if (PetscRealPart(fshift)) { 18879566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18887b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18897b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18907b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1892899639b0SHong Zhang } 189371f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 189471f1c65dSBarry Smith } 18959566063dSJacob 
Faibussowitsch PetscCall(PetscLogFlops(m)); 189671f1c65dSBarry Smith } else { 189771f1c65dSBarry Smith for (i = 0; i < m; i++) { 189871f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 189971f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 190071f1c65dSBarry Smith } 19019566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190271f1c65dSBarry Smith } 190371f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 190571f1c65dSBarry Smith PetscFunctionReturn(0); 190671f1c65dSBarry Smith } 190771f1c65dSBarry Smith 1908c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1909d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1910d71ae5a4SJacob Faibussowitsch { 1911416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1912e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19132e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 191454f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19153d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 191697f1f81fSBarry Smith const PetscInt *idx, *diag; 191717ab2063SBarry Smith 19183a40ed3dSBarry Smith PetscFunctionBegin; 1919b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19209566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1921b215bc84SStefano Zampini PetscFunctionReturn(0); 1922b215bc84SStefano Zampini } 1923b965ef7fSBarry Smith its = its * lits; 192491723122SBarry Smith 192571f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19269566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 192771f1c65dSBarry Smith a->fshift = fshift; 192871f1c65dSBarry Smith 
a->omega = omega; 1929ed480e8bSBarry Smith 193071f1c65dSBarry Smith diag = a->diag; 193171f1c65dSBarry Smith t = a->ssor_work; 1932ed480e8bSBarry Smith idiag = a->idiag; 193371f1c65dSBarry Smith mdiag = a->mdiag; 1934ed480e8bSBarry Smith 19359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19369566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19379566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1938ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 193917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 194017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1941ed480e8bSBarry Smith bs = b; 194217ab2063SBarry Smith for (i = 0; i < m; i++) { 194371f1c65dSBarry Smith d = fshift + mdiag[i]; 1944416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1945ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19462e5835c6SStefano Zampini v = aa + diag[i] + 1; 194717ab2063SBarry Smith sum = b[i] * d / omega; 1948003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 194917ab2063SBarry Smith x[i] = sum; 195017ab2063SBarry Smith } 19519566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19529566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19553a40ed3dSBarry Smith PetscFunctionReturn(0); 195617ab2063SBarry Smith } 1957c783ea89SBarry Smith 195808401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1959f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19604c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1961887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196217ab2063SBarry Smith 196317ab2063SBarry Smith (L + E)^{-1} A (U + 
E)^{-1} 196417ab2063SBarry Smith 1965887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 196617ab2063SBarry Smith */ 196717ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 196817ab2063SBarry Smith 196917ab2063SBarry Smith /* x = (E + U)^{-1} b */ 197017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1971416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1972ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19732e5835c6SStefano Zampini v = aa + diag[i] + 1; 197417ab2063SBarry Smith sum = b[i]; 1975e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1976ed480e8bSBarry Smith x[i] = sum * idiag[i]; 197717ab2063SBarry Smith } 197817ab2063SBarry Smith 197917ab2063SBarry Smith /* t = b - (2*E - D)x */ 19802e5835c6SStefano Zampini v = aa; 19812205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198217ab2063SBarry Smith 198317ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1984ed480e8bSBarry Smith ts = t; 1985416022c9SBarry Smith diag = a->diag; 198617ab2063SBarry Smith for (i = 0; i < m; i++) { 1987416022c9SBarry Smith n = diag[i] - a->i[i]; 1988ed480e8bSBarry Smith idx = a->j + a->i[i]; 19892e5835c6SStefano Zampini v = aa + a->i[i]; 199017ab2063SBarry Smith sum = t[i]; 1991003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1992ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1993733d66baSBarry Smith /* x = x + t */ 1994733d66baSBarry Smith x[i] += t[i]; 199517ab2063SBarry Smith } 199617ab2063SBarry Smith 19979566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 19989566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20003a40ed3dSBarry Smith PetscFunctionReturn(0); 200117ab2063SBarry Smith } 200217ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 200317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 200417ab2063SBarry Smith for (i = 0; i < m; i++) 
{ 2005416022c9SBarry Smith n = diag[i] - a->i[i]; 2006ed480e8bSBarry Smith idx = a->j + a->i[i]; 20072e5835c6SStefano Zampini v = aa + a->i[i]; 200817ab2063SBarry Smith sum = b[i]; 2009e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20105c99c7daSBarry Smith t[i] = sum; 2011ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201217ab2063SBarry Smith } 20135c99c7daSBarry Smith xb = t; 20149566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20153a40ed3dSBarry Smith } else xb = b; 201617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 201717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2018416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2019ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20202e5835c6SStefano Zampini v = aa + diag[i] + 1; 202117ab2063SBarry Smith sum = xb[i]; 2022e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20235c99c7daSBarry Smith if (xb == b) { 2024ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20255c99c7daSBarry Smith } else { 2026b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 202717ab2063SBarry Smith } 20285c99c7daSBarry Smith } 20299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 203017ab2063SBarry Smith } 203117ab2063SBarry Smith its--; 203217ab2063SBarry Smith } 203317ab2063SBarry Smith while (its--) { 203417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203517ab2063SBarry Smith for (i = 0; i < m; i++) { 2036b19a5dc2SMark Adams /* lower */ 2037b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2038ed480e8bSBarry Smith idx = a->j + a->i[i]; 20392e5835c6SStefano Zampini v = aa + a->i[i]; 204017ab2063SBarry Smith sum = b[i]; 2041e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2042b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2043b19a5dc2SMark Adams /* upper */ 2044b19a5dc2SMark Adams n = a->i[i + 1] - 
diag[i] - 1; 2045b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20462e5835c6SStefano Zampini v = aa + diag[i] + 1; 2047b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2048b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204917ab2063SBarry Smith } 2050b19a5dc2SMark Adams xb = t; 20519566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2052b19a5dc2SMark Adams } else xb = b; 205317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2055b19a5dc2SMark Adams sum = xb[i]; 2056b19a5dc2SMark Adams if (xb == b) { 2057b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2058416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2059ed480e8bSBarry Smith idx = a->j + a->i[i]; 20602e5835c6SStefano Zampini v = aa + a->i[i]; 2061e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2062ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2063b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2064b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2065b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20662e5835c6SStefano Zampini v = aa + diag[i] + 1; 2067b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2068b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206917ab2063SBarry Smith } 2070b19a5dc2SMark Adams } 2071b19a5dc2SMark Adams if (xb == b) { 20729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2073b19a5dc2SMark Adams } else { 20749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2075b19a5dc2SMark Adams } 207617ab2063SBarry Smith } 207717ab2063SBarry Smith } 20789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20799566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2081365a8a9eSBarry Smith PetscFunctionReturn(0); 208217ab2063SBarry Smith } 208317ab2063SBarry Smith 2084d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2085d71ae5a4SJacob Faibussowitsch { 2086416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20874e220ebcSLois Curfman McInnes 20883a40ed3dSBarry Smith PetscFunctionBegin; 20894e220ebcSLois Curfman McInnes info->block_size = 1.0; 20903966268fSBarry Smith info->nz_allocated = a->maxnz; 20913966268fSBarry Smith info->nz_used = a->nz; 20923966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20933966268fSBarry Smith info->assemblies = A->num_ass; 20943966268fSBarry Smith info->mallocs = A->info.mallocs; 20954dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2096d5f3da31SBarry Smith if (A->factortype) { 20974e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20984e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20994e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21004e220ebcSLois Curfman McInnes } else { 21014e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21024e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21034e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21044e220ebcSLois Curfman 
McInnes } 21053a40ed3dSBarry Smith PetscFunctionReturn(0); 210617ab2063SBarry Smith } 210717ab2063SBarry Smith 2108d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2109d71ae5a4SJacob Faibussowitsch { 2110416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2111c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211297b48c8fSBarry Smith const PetscScalar *xx; 21132e5835c6SStefano Zampini PetscScalar *bb, *aa; 2114c7da8527SEric Chamberland PetscInt d = 0; 211517ab2063SBarry Smith 21163a40ed3dSBarry Smith PetscFunctionBegin; 211797b48c8fSBarry Smith if (x && b) { 21189566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21199566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 212097b48c8fSBarry Smith for (i = 0; i < N; i++) { 2121aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2122447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 212397b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 212497b48c8fSBarry Smith } 21259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21269566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 212797b48c8fSBarry Smith } 212897b48c8fSBarry Smith 21299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2130a9817697SBarry Smith if (a->keepnonzeropattern) { 2131f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2132aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21339566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2134f1e2ffcdSBarry Smith } 2135f4df32b1SMatthew Knepley if (diag != 0.0) { 2136c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2137c7da8527SEric Chamberland d = rows[i]; 2138447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 213908401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2140c7da8527SEric Chamberland } 2141f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2142447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21432e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2144f1e2ffcdSBarry Smith } 2145f1e2ffcdSBarry Smith } 2146f1e2ffcdSBarry Smith } else { 2147f4df32b1SMatthew Knepley if (diag != 0.0) { 214817ab2063SBarry Smith for (i = 0; i < N; i++) { 2149aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21507ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2151447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2152447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2153447d62f5SStefano Zampini } else { 2154416022c9SBarry Smith a->ilen[rows[i]] = 1; 21552e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2156bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2157447d62f5SStefano Zampini } 2158447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21599566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 216017ab2063SBarry Smith } 216117ab2063SBarry Smith } 21623a40ed3dSBarry Smith } else { 216317ab2063SBarry Smith for (i = 0; i < N; i++) { 2164aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2165416022c9SBarry Smith a->ilen[rows[i]] = 0; 216617ab2063SBarry Smith } 216717ab2063SBarry Smith } 2168e56f5c9eSBarry Smith A->nonzerostate++; 2169f1e2ffcdSBarry Smith } 21709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2171dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21723a40ed3dSBarry Smith PetscFunctionReturn(0); 217317ab2063SBarry Smith } 217417ab2063SBarry Smith 2175d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2176d71ae5a4SJacob Faibussowitsch { 21776e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21786e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21792b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21806e169961SBarry Smith const PetscScalar *xx; 21812e5835c6SStefano Zampini PetscScalar *bb, *aa; 21826e169961SBarry Smith 21836e169961SBarry Smith PetscFunctionBegin; 21842e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21866e169961SBarry Smith if (x && b) { 21879566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21889566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21892b40b63fSBarry Smith vecs = PETSC_TRUE; 21906e169961SBarry Smith } 21919566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21926e169961SBarry Smith for (i = 0; i < N; i++) { 2193aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21949566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 21952205254eSKarl Rupp 21966e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21976e169961SBarry Smith } 21986e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 21996e169961SBarry Smith if (!zeroed[i]) { 22006e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22014cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22022e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22032e5835c6SStefano Zampini aa[j] = 0.0; 22046e169961SBarry Smith } 22056e169961SBarry Smith } 22064cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22076e169961SBarry Smith } 22086e169961SBarry Smith if (x && b) { 22099566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22109566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22116e169961SBarry Smith } 22129566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22136e169961SBarry Smith if (diag != 0.0) { 22149566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22151d5a398dSstefano_zampini if (missing) { 22161d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22174cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2218aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22199566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22201d5a398dSstefano_zampini } 22211d5a398dSstefano_zampini } else { 2222ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22236e169961SBarry Smith } 22241d5a398dSstefano_zampini } 22259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2226dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22276e169961SBarry Smith PetscFunctionReturn(0); 22286e169961SBarry Smith } 22296e169961SBarry Smith 2230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2231d71ae5a4SJacob Faibussowitsch { 2232fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2233fff043a9SJunchao Zhang const PetscScalar *aa; 2234fff043a9SJunchao Zhang PetscInt *itmp; 223517ab2063SBarry Smith 22363a40ed3dSBarry Smith PetscFunctionBegin; 22379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2238416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22392e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 224017ab2063SBarry Smith if (idx) { 2241bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224226fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2243f4259b30SLisandro Dalcin else *idx = NULL; 224417ab2063SBarry Smith } 22459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22463a40ed3dSBarry Smith PetscFunctionReturn(0); 224717ab2063SBarry Smith } 224817ab2063SBarry Smith 2249d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2250d71ae5a4SJacob Faibussowitsch { 22513a40ed3dSBarry Smith PetscFunctionBegin; 2252cb4a9cd9SHong Zhang if (nz) *nz = 0; 22532e5835c6SStefano Zampini if (idx) *idx = NULL; 22542e5835c6SStefano Zampini if (v) *v = NULL; 22553a40ed3dSBarry Smith PetscFunctionReturn(0); 225617ab2063SBarry Smith } 225717ab2063SBarry Smith 2258d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2259d71ae5a4SJacob Faibussowitsch { 2260416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22612e5835c6SStefano Zampini const MatScalar *v; 226236db0b34SBarry Smith PetscReal sum = 0.0; 226397f1f81fSBarry Smith PetscInt i, j; 226417ab2063SBarry Smith 22653a40ed3dSBarry Smith PetscFunctionBegin; 22669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 226717ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2268570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2269570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2270792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2271570b7f6dSBarry Smith #else 2272416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22739371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22749371c9d4SSatish Balay v++; 227517ab2063SBarry Smith } 22768f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2277570b7f6dSBarry Smith #endif 22789566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22793a40ed3dSBarry Smith } else if (type == NORM_1) { 228036db0b34SBarry Smith PetscReal *tmp; 228197f1f81fSBarry Smith PetscInt *jj = a->j; 22829566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2283064f8208SBarry Smith *nrm = 0.0; 2284416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22859371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22869371c9d4SSatish Balay v++; 228717ab2063SBarry Smith } 2288d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2289064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229017ab2063SBarry Smith } 22919566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22929566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22933a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2294064f8208SBarry Smith *nrm = 0.0; 2295d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22962e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 229717ab2063SBarry Smith sum = 0.0; 2298416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 22999371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23009371c9d4SSatish Balay v2++; 230117ab2063SBarry Smith } 2302064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230317ab2063SBarry Smith } 23049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2305f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23073a40ed3dSBarry Smith PetscFunctionReturn(0); 230817ab2063SBarry Smith } 230917ab2063SBarry Smith 2310d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2311d71ae5a4SJacob Faibussowitsch { 23123d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231354f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23142e5835c6SStefano Zampini const MatScalar *va, *vb; 
231597f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2316cd0d46ebSvictorle 2317cd0d46ebSvictorle PetscFunctionBegin; 23189566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23199566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23205485867bSBarry Smith if (ma != nb || na != mb) { 23215485867bSBarry Smith *f = PETSC_FALSE; 23225485867bSBarry Smith PetscFunctionReturn(0); 23235485867bSBarry Smith } 23249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23269371c9d4SSatish Balay aii = aij->i; 23279371c9d4SSatish Balay bii = bij->i; 23289371c9d4SSatish Balay adx = aij->j; 23299371c9d4SSatish Balay bdx = bij->j; 23309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2332cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2333cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2334cd0d46ebSvictorle 2335cd0d46ebSvictorle *f = PETSC_TRUE; 2336cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2337cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 233897f1f81fSBarry Smith PetscInt idc, idr; 23395485867bSBarry Smith PetscScalar vc, vr; 2340cd0d46ebSvictorle /* column/row index/value */ 23415485867bSBarry Smith idc = adx[aptr[i]]; 23425485867bSBarry Smith idr = bdx[bptr[idc]]; 23435485867bSBarry Smith vc = va[aptr[i]]; 23445485867bSBarry Smith vr = vb[bptr[idc]]; 23455485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23465485867bSBarry Smith *f = PETSC_FALSE; 23475485867bSBarry Smith goto done; 2348cd0d46ebSvictorle } else { 23495485867bSBarry Smith aptr[i]++; 23505485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2351cd0d46ebSvictorle } 2352cd0d46ebSvictorle } 2353cd0d46ebSvictorle } 2354cd0d46ebSvictorle done: 23559566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23569566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2359cd0d46ebSvictorle PetscFunctionReturn(0); 2360cd0d46ebSvictorle } 2361cd0d46ebSvictorle 2362d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2363d71ae5a4SJacob Faibussowitsch { 23643d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236554f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236654f21887SBarry Smith MatScalar *va, *vb; 23671cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23681cbb95d3SBarry Smith 23691cbb95d3SBarry Smith PetscFunctionBegin; 23709566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23719566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23721cbb95d3SBarry Smith if (ma != nb || na != mb) { 23731cbb95d3SBarry Smith *f = PETSC_FALSE; 23741cbb95d3SBarry Smith PetscFunctionReturn(0); 23751cbb95d3SBarry Smith } 23769371c9d4SSatish Balay aii = aij->i; 23779371c9d4SSatish Balay bii = bij->i; 23789371c9d4SSatish Balay adx = aij->j; 23799371c9d4SSatish Balay bdx = bij->j; 23809371c9d4SSatish Balay va = aij->a; 23819371c9d4SSatish Balay vb = bij->a; 23829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23841cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23851cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23861cbb95d3SBarry Smith 23871cbb95d3SBarry Smith *f = PETSC_TRUE; 23881cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23891cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23901cbb95d3SBarry Smith PetscInt idc, idr; 23911cbb95d3SBarry Smith PetscScalar vc, vr; 23921cbb95d3SBarry Smith /* column/row index/value */ 23931cbb95d3SBarry Smith idc = adx[aptr[i]]; 23941cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
23951cbb95d3SBarry Smith vc = va[aptr[i]]; 23961cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23971cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 23981cbb95d3SBarry Smith *f = PETSC_FALSE; 23991cbb95d3SBarry Smith goto done; 24001cbb95d3SBarry Smith } else { 24011cbb95d3SBarry Smith aptr[i]++; 24021cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24031cbb95d3SBarry Smith } 24041cbb95d3SBarry Smith } 24051cbb95d3SBarry Smith } 24061cbb95d3SBarry Smith done: 24079566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24089566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24091cbb95d3SBarry Smith PetscFunctionReturn(0); 24101cbb95d3SBarry Smith } 24111cbb95d3SBarry Smith 2412d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2413d71ae5a4SJacob Faibussowitsch { 24149e29f15eSvictorle PetscFunctionBegin; 24159566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24169e29f15eSvictorle PetscFunctionReturn(0); 24179e29f15eSvictorle } 24189e29f15eSvictorle 2419d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2420d71ae5a4SJacob Faibussowitsch { 24211cbb95d3SBarry Smith PetscFunctionBegin; 24229566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24231cbb95d3SBarry Smith PetscFunctionReturn(0); 24241cbb95d3SBarry Smith } 24251cbb95d3SBarry Smith 2426d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2427d71ae5a4SJacob Faibussowitsch { 2428416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2429fff8e43fSBarry Smith const PetscScalar *l, *r; 2430fff8e43fSBarry Smith PetscScalar x; 243154f21887SBarry Smith MatScalar *v; 2432fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2433fff8e43fSBarry Smith const PetscInt *jj; 243417ab2063SBarry Smith 24353a40ed3dSBarry Smith PetscFunctionBegin; 
243617ab2063SBarry Smith if (ll) { 24373ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24383ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24399566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244008401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24419566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244317ab2063SBarry Smith for (i = 0; i < m; i++) { 244417ab2063SBarry Smith x = l[i]; 2445416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24462205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244717ab2063SBarry Smith } 24489566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24499566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245117ab2063SBarry Smith } 245217ab2063SBarry Smith if (rr) { 24539566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245408401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24559566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24572e5835c6SStefano Zampini jj = a->j; 24582205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246217ab2063SBarry Smith } 24639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24643a40ed3dSBarry Smith PetscFunctionReturn(0); 246517ab2063SBarry Smith } 246617ab2063SBarry Smith 2467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2468d71ae5a4SJacob Faibussowitsch { 2469db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2470d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247197f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24725d0c19d7SBarry Smith const PetscInt *irow, *icol; 24732e5835c6SStefano Zampini const PetscScalar *aa; 24745d0c19d7SBarry Smith PetscInt nrows, ncols; 247597f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 247654f21887SBarry Smith MatScalar *a_new, *mat_a; 2477416022c9SBarry Smith Mat C; 2478cdc6f3adSToby Isaac PetscBool stride; 247917ab2063SBarry Smith 24803a40ed3dSBarry Smith PetscFunctionBegin; 24819566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24829566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24839566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248417ab2063SBarry Smith 24859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2486ff718158SBarry Smith if (stride) { 24879566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2488ff718158SBarry Smith } else { 2489ff718158SBarry Smith first = 0; 2490ff718158SBarry Smith step = 0; 2491ff718158SBarry Smith } 2492fee21e36SBarry Smith if (stride && step == 1) { 249302834360SBarry Smith /* special case of contiguous rows */ 24949566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249502834360SBarry Smith /* loop over new rows determining lens and starting points */ 249602834360SBarry Smith for (i = 0; i < nrows; i++) { 2497bfeeae90SHong Zhang kstart = ai[irow[i]]; 2498a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2499a91a9bebSLisandro Dalcin starts[i] = kstart; 250002834360SBarry Smith for (k = kstart; k < kend; k++) { 2501bfeeae90SHong Zhang if (aj[k] >= 
first) { 250202834360SBarry Smith starts[i] = k; 250302834360SBarry Smith break; 250402834360SBarry Smith } 250502834360SBarry Smith } 2506a2744918SBarry Smith sum = 0; 250702834360SBarry Smith while (k < kend) { 2508bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2509a2744918SBarry Smith sum++; 251002834360SBarry Smith } 2511a2744918SBarry Smith lens[i] = sum; 251202834360SBarry Smith } 251302834360SBarry Smith /* create submatrix */ 2514cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251597f1f81fSBarry Smith PetscInt n_cols, n_rows; 25169566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2517aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25189566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251908480c60SBarry Smith C = *B; 25203a40ed3dSBarry Smith } else { 25213bef6203SJed Brown PetscInt rbs, cbs; 25229566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25239566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25249566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25259566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25279566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252908480c60SBarry Smith } 2530db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2531db02288aSLois Curfman McInnes 253202834360SBarry Smith /* loop over rows inserting into submatrix */ 2533db02288aSLois Curfman McInnes a_new = c->a; 2534db02288aSLois Curfman McInnes j_new = c->j; 2535db02288aSLois Curfman McInnes i_new = c->i; 25369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253702834360SBarry Smith for (i 
= 0; i < nrows; i++) { 2538a2744918SBarry Smith ii = starts[i]; 2539a2744918SBarry Smith lensi = lens[i]; 2540ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25419566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2542a2744918SBarry Smith a_new += lensi; 2543a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2544a2744918SBarry Smith c->ilen[i] = lensi; 254502834360SBarry Smith } 25469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25479566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25483a40ed3dSBarry Smith } else { 25499566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25524dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25536bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25544dcab191SBarry Smith smap[icol[i]] = i + 1; 25554dcab191SBarry Smith } 25564dcab191SBarry Smith 255702834360SBarry Smith /* determine lens of each row */ 255802834360SBarry Smith for (i = 0; i < nrows; i++) { 2559bfeeae90SHong Zhang kstart = ai[irow[i]]; 256002834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256102834360SBarry Smith lens[i] = 0; 256202834360SBarry Smith for (k = kstart; k < kend; k++) { 2563ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256402834360SBarry Smith } 256502834360SBarry Smith } 256617ab2063SBarry Smith /* Create and fill new matrix */ 2567a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2568ace3abfcSBarry Smith PetscBool equal; 25690f5bd95cSBarry Smith 257099141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2571aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == 
ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25729566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 257328b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25749566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257508480c60SBarry Smith C = *B; 25763a40ed3dSBarry Smith } else { 25773bef6203SJed Brown PetscInt rbs, cbs; 25789566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25799566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25809566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25819566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25829566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25839566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258508480c60SBarry Smith } 25869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 258799141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 258817ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258999141d43SSatish Balay row = irow[i]; 2590bfeeae90SHong Zhang kstart = ai[row]; 259199141d43SSatish Balay kend = kstart + a->ilen[row]; 2592bfeeae90SHong Zhang mat_i = c->i[i]; 259399141d43SSatish Balay mat_j = c->j + mat_i; 259499141d43SSatish Balay mat_a = c->a + mat_i; 259599141d43SSatish Balay mat_ilen = c->ilen + i; 259617ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2597bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2598ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25992e5835c6SStefano Zampini *mat_a++ = aa[k]; 260099141d43SSatish Balay (*mat_ilen)++; 260117ab2063SBarry Smith } 260217ab2063SBarry Smith } 260317ab2063SBarry Smith } 26049566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260502834360SBarry Smith /* Free work space */ 26069566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26079566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26089566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2609cdc6f3adSToby Isaac /* sort */ 2610cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2611cdc6f3adSToby Isaac PetscInt ilen; 2612cdc6f3adSToby Isaac 2613cdc6f3adSToby Isaac mat_i = c->i[i]; 2614cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2615cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2616cdc6f3adSToby Isaac ilen = c->ilen[i]; 26179566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2618cdc6f3adSToby Isaac } 261902834360SBarry Smith } 26208c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26219566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2622305c6ccfSStefano Zampini #endif 26239566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26249566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262517ab2063SBarry Smith 26269566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2627416022c9SBarry Smith *B = C; 26283a40ed3dSBarry Smith PetscFunctionReturn(0); 262917ab2063SBarry Smith } 263017ab2063SBarry Smith 2631d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2632d71ae5a4SJacob Faibussowitsch { 263382d44351SHong Zhang Mat B; 263482d44351SHong Zhang 263582d44351SHong Zhang PetscFunctionBegin; 2636c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26379566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26389566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26399566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26409566063dSJacob Faibussowitsch 
PetscCall(MatSetType(B, MATSEQAIJ)); 26419566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264282d44351SHong Zhang *subMat = B; 2643c2d650bdSHong Zhang } else { 26449566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2645c2d650bdSHong Zhang } 264682d44351SHong Zhang PetscFunctionReturn(0); 264782d44351SHong Zhang } 264882d44351SHong Zhang 2649d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2650d71ae5a4SJacob Faibussowitsch { 265163b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265263b91edcSBarry Smith Mat outA; 2653ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265463b91edcSBarry Smith 26553a40ed3dSBarry Smith PetscFunctionBegin; 265608401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26571df811f5SHong Zhang 26589566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26599566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2660a871dcd8SBarry Smith 266163b91edcSBarry Smith outA = inA; 2662d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26639566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26649566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26652205254eSKarl Rupp 26669566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26679566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26682205254eSKarl Rupp 2669c3122656SLisandro Dalcin a->row = row; 26702205254eSKarl Rupp 26719566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26729566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26732205254eSKarl Rupp 2674c3122656SLisandro Dalcin a->col = col; 267563b91edcSBarry Smith 267636db0b34SBarry Smith /* Create the inverse permutation so 
that it can be used in MatLUFactorNumeric() */ 26779566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26789566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2679f0ec6fceSSatish Balay 268094a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268294a9d846SBarry Smith } 268363b91edcSBarry Smith 26849566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2685137fb511SHong Zhang if (row_identity && col_identity) { 26869566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2687137fb511SHong Zhang } else { 26889566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2689137fb511SHong Zhang } 26903a40ed3dSBarry Smith PetscFunctionReturn(0); 2691a871dcd8SBarry Smith } 2692a871dcd8SBarry Smith 2693d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2694d71ae5a4SJacob Faibussowitsch { 2695f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2696dfa0f9e5SStefano Zampini PetscScalar *v; 2697c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26983a40ed3dSBarry Smith 26993a40ed3dSBarry Smith PetscFunctionBegin; 27009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27019566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2702792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27039566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27063a40ed3dSBarry Smith PetscFunctionReturn(0); 2707f0b747eeSBarry Smith } 2708f0b747eeSBarry Smith 2709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 
2710d71ae5a4SJacob Faibussowitsch { 271116b64355SHong Zhang PetscInt i; 271216b64355SHong Zhang 271316b64355SHong Zhang PetscFunctionBegin; 271416b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27159566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271616b64355SHong Zhang 271748a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27189566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 271916b64355SHong Zhang 272016b64355SHong Zhang if (submatj->rbuf1) { 27219566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27229566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272316b64355SHong Zhang } 272416b64355SHong Zhang 272548a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27269566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27279566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272816b64355SHong Zhang } 272916b64355SHong Zhang 273016b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27319566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->rmap)); 27329566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27339566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273416b64355SHong Zhang #else 27359566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273616b64355SHong Zhang #endif 273716b64355SHong Zhang 273816b64355SHong Zhang if (!submatj->allcolumns) { 273916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27409566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->cmap)); 274116b64355SHong Zhang #else 27429566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274316b64355SHong 
Zhang #endif 274416b64355SHong Zhang } 27459566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274616b64355SHong Zhang 27479566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 274816b64355SHong Zhang PetscFunctionReturn(0); 274916b64355SHong Zhang } 275016b64355SHong Zhang 2751d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2752d71ae5a4SJacob Faibussowitsch { 275316b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27545c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275516b64355SHong Zhang 275616b64355SHong Zhang PetscFunctionBegin; 27579566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27589566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 275916b64355SHong Zhang PetscFunctionReturn(0); 276016b64355SHong Zhang } 276116b64355SHong Zhang 276289a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2764d71ae5a4SJacob Faibussowitsch { 27652d033e1fSHong Zhang PetscInt i; 27660fb991dcSHong Zhang Mat C; 27670fb991dcSHong Zhang Mat_SeqAIJ *c; 27680fb991dcSHong Zhang Mat_SubSppt *submatj; 27692d033e1fSHong Zhang 27702d033e1fSHong Zhang PetscFunctionBegin; 27712d033e1fSHong Zhang for (i = 0; i < n; i++) { 27720fb991dcSHong Zhang C = (*mat)[i]; 27730fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27740fb991dcSHong Zhang submatj = c->submatis1; 27752d033e1fSHong Zhang if (submatj) { 2776682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277726cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27789566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27799566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27809566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27813faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27829566063dSJacob 
Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27839566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27849566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2785682e4c99SStefano Zampini } 27862d033e1fSHong Zhang } else { 27879566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27882d033e1fSHong Zhang } 27892d033e1fSHong Zhang } 279086e85357SHong Zhang 279163a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27929566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279363a75b2aSHong Zhang 27949566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27952d033e1fSHong Zhang PetscFunctionReturn(0); 27962d033e1fSHong Zhang } 27972d033e1fSHong Zhang 2798d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2799d71ae5a4SJacob Faibussowitsch { 280097f1f81fSBarry Smith PetscInt i; 2801cddf8d76SBarry Smith 28023a40ed3dSBarry Smith PetscFunctionBegin; 280348a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2804cddf8d76SBarry Smith 280548a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28063a40ed3dSBarry Smith PetscFunctionReturn(0); 2807cddf8d76SBarry Smith } 2808cddf8d76SBarry Smith 2809d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2810d71ae5a4SJacob Faibussowitsch { 2811e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2812*9a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28135d0c19d7SBarry Smith const PetscInt *idx; 2814*9a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? 
A->rmap->bs : 1; 2815f1af5d2fSBarry Smith PetscBT table; 2816bbd702dbSSatish Balay 28173a40ed3dSBarry Smith PetscFunctionBegin; 2818*9a88ca10SBarry Smith m = A->rmap->n / bs; 2819e4d965acSSatish Balay ai = a->i; 2820bfeeae90SHong Zhang aj = a->j; 28218a047759SSatish Balay 282208401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282306763907SSatish Balay 28249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28259566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282606763907SSatish Balay 2827e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2828b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2829e4d965acSSatish Balay isz = 0; 28309566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2831e4d965acSSatish Balay 2832e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28339566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28349566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2835e4d965acSSatish Balay 2836*9a88ca10SBarry Smith if (bs > 1) { 2837*9a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2838*9a88ca10SBarry Smith for (j = 0; j < n; ++j) { 2839*9a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 2840*9a88ca10SBarry Smith } 2841*9a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 2842*9a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 2843*9a88ca10SBarry Smith 2844*9a88ca10SBarry Smith k = 0; 2845*9a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 2846*9a88ca10SBarry Smith n = isz; 2847*9a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2848*9a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 2849*9a88ca10SBarry Smith row = bs * nidx[k] + ll; 2850*9a88ca10SBarry Smith start = ai[row]; 2851*9a88ca10SBarry Smith end = ai[row + 1]; 2852*9a88ca10SBarry Smith for (l = start; l < end; l++) { 2853*9a88ca10SBarry Smith val = aj[l] / bs; 2854*9a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2855*9a88ca10SBarry Smith } 2856*9a88ca10SBarry Smith } 2857*9a88ca10SBarry Smith } 2858*9a88ca10SBarry Smith } 2859*9a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2860*9a88ca10SBarry Smith } else { 2861dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2862e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28632205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28644dcbc457SBarry Smith } 28659566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28669566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2867e4d965acSSatish Balay 286804a348a9SBarry Smith k = 0; 286904a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287004a348a9SBarry Smith n = isz; 287106763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2872e4d965acSSatish Balay row = nidx[k]; 2873e4d965acSSatish Balay start = ai[row]; 2874e4d965acSSatish Balay end = ai[row + 1]; 287504a348a9SBarry Smith for (l = start; l < end; l++) { 2876efb16452SHong Zhang val = aj[l]; 28772205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2878e4d965acSSatish Balay } 2879e4d965acSSatish Balay } 2880e4d965acSSatish Balay } 28819566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2882e4d965acSSatish Balay } 2883*9a88ca10SBarry Smith } 28849566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28859566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28863a40ed3dSBarry Smith PetscFunctionReturn(0); 28874dcbc457SBarry Smith } 288817ab2063SBarry Smith 28890513a670SBarry Smith /* -------------------------------------------------------------- */ 2890d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2891d71ae5a4SJacob Faibussowitsch { 28920513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28933b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28945d0c19d7SBarry Smith const PetscInt *row, *col; 28955d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 289656cd22aeSBarry Smith IS icolp, irowp; 28970298fd71SBarry Smith PetscInt *cwork = NULL; 
28980298fd71SBarry Smith PetscScalar *vwork = NULL; 28990513a670SBarry Smith 29003a40ed3dSBarry Smith PetscFunctionBegin; 29019566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29029566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29039566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29049566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29050513a670SBarry Smith 29060513a670SBarry Smith /* determine lengths of permuted rows */ 29079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29082205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29099566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29109566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29119566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29129566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29149566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29150513a670SBarry Smith 29169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29170513a670SBarry Smith for (i = 0; i < m; i++) { 29189566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29192205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29209566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29219566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29220513a670SBarry Smith } 29239566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29242205254eSKarl Rupp 29253c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29262205254eSKarl Rupp 29278c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29289566063dSJacob Faibussowitsch 
PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29299fe5e383SStefano Zampini #endif 29309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29329566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29339566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29349566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29359566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 293648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29373a40ed3dSBarry Smith PetscFunctionReturn(0); 29380513a670SBarry Smith } 29390513a670SBarry Smith 2940d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2941d71ae5a4SJacob Faibussowitsch { 2942cb5b572fSBarry Smith PetscFunctionBegin; 294333f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 294433f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2945be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2946be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29472e5835c6SStefano Zampini const PetscScalar *aa; 2948be6bf707SBarry Smith 29499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295008401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29519566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29529566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2954cb5b572fSBarry Smith } else { 29559566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2956cb5b572fSBarry Smith } 2957cb5b572fSBarry Smith PetscFunctionReturn(0); 2958cb5b572fSBarry Smith } 2959cb5b572fSBarry Smith 2960d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2961d71ae5a4SJacob Faibussowitsch { 2962273d9f13SBarry Smith PetscFunctionBegin; 29639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2964273d9f13SBarry Smith PetscFunctionReturn(0); 2965273d9f13SBarry Smith } 2966273d9f13SBarry Smith 2967d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2968d71ae5a4SJacob Faibussowitsch { 29696c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29706e111a19SKarl Rupp 29716c0721eeSBarry Smith PetscFunctionBegin; 29726c0721eeSBarry Smith *array = a->a; 29736c0721eeSBarry Smith PetscFunctionReturn(0); 29746c0721eeSBarry Smith } 29756c0721eeSBarry Smith 2976d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2977d71ae5a4SJacob Faibussowitsch { 29786c0721eeSBarry Smith PetscFunctionBegin; 2979f38c1e66SStefano Zampini *array = NULL; 29806c0721eeSBarry Smith PetscFunctionReturn(0); 29816c0721eeSBarry Smith } 2982273d9f13SBarry Smith 29838229c054SShri Abhyankar /* 29848229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29858229c054SShri Abhyankar have different nonzero structure. 29868229c054SShri Abhyankar */ 2987d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2988d71ae5a4SJacob Faibussowitsch { 2989b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2990ec7775f6SShri Abhyankar 2991ec7775f6SShri Abhyankar PetscFunctionBegin; 2992ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2993ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 2994b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 2995b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2996b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29978af7cee1SJed Brown nnz[i] = 0; 29988af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2999b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3000b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30018af7cee1SJed Brown nnz[i]++; 30028af7cee1SJed Brown } 30038af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3004ec7775f6SShri Abhyankar } 3005ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3006ec7775f6SShri Abhyankar } 3007ec7775f6SShri Abhyankar 3008d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3009d71ae5a4SJacob Faibussowitsch { 3010b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3011b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3012b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 3013b264fe52SHong Zhang 3014b264fe52SHong Zhang PetscFunctionBegin; 3015b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30169566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 3017b264fe52SHong Zhang PetscFunctionReturn(0); 3018b264fe52SHong Zhang } 3019b264fe52SHong Zhang 3020d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3021d71ae5a4SJacob Faibussowitsch { 3022ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3023ac90fabeSBarry Smith 3024ac90fabeSBarry Smith PetscFunctionBegin; 3025134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3026134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3027134adf20SPierre Jolivet if (e) { 30289566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 302981fa06acSBarry Smith if (e) { 30309566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3031134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303281fa06acSBarry Smith } 303381fa06acSBarry Smith } 303454c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303581fa06acSBarry Smith } 3036ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30372e5835c6SStefano Zampini const PetscScalar *xa; 30382e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 303981fa06acSBarry Smith PetscBLASInt one = 1, bnz; 304081fa06acSBarry Smith 30419566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3044792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30479566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30499566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3050ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30519566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3052ac90fabeSBarry Smith } else { 30538229c054SShri Abhyankar Mat B; 30548229c054SShri Abhyankar PetscInt *nnz; 30559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30569566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30579566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30589566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30599566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30609566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30629566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30639566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30649bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30659566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3066ac90fabeSBarry Smith } 3067ac90fabeSBarry Smith PetscFunctionReturn(0); 3068ac90fabeSBarry Smith } 3069ac90fabeSBarry Smith 3070d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3071d71ae5a4SJacob Faibussowitsch { 3072354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3073354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3074354c94deSBarry Smith 
PetscInt i, nz; 3075354c94deSBarry Smith PetscScalar *a; 3076354c94deSBarry Smith 3077354c94deSBarry Smith PetscFunctionBegin; 3078354c94deSBarry Smith nz = aij->nz; 30799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30802205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3082354c94deSBarry Smith #else 3083354c94deSBarry Smith PetscFunctionBegin; 3084354c94deSBarry Smith #endif 3085354c94deSBarry Smith PetscFunctionReturn(0); 3086354c94deSBarry Smith } 3087354c94deSBarry Smith 3088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3089d71ae5a4SJacob Faibussowitsch { 3090e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3091d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3092e34fafa9SBarry Smith PetscReal atmp; 3093985db425SBarry Smith PetscScalar *x; 3094ce496241SStefano Zampini const MatScalar *aa, *av; 3095e34fafa9SBarry Smith 3096e34fafa9SBarry Smith PetscFunctionBegin; 309728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3099ce496241SStefano Zampini aa = av; 3100e34fafa9SBarry Smith ai = a->i; 3101e34fafa9SBarry Smith aj = a->j; 3102e34fafa9SBarry Smith 31039566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31049566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31059566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 310608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3107e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31089371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31099371c9d4SSatish Balay ai++; 3110e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3111985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
31129371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31139371c9d4SSatish Balay x[i] = atmp; 31149371c9d4SSatish Balay if (idx) idx[i] = *aj; 31159371c9d4SSatish Balay } 31169371c9d4SSatish Balay aa++; 31179371c9d4SSatish Balay aj++; 3118985db425SBarry Smith } 3119985db425SBarry Smith } 31209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3122985db425SBarry Smith PetscFunctionReturn(0); 3123985db425SBarry Smith } 3124985db425SBarry Smith 3125d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3126d71ae5a4SJacob Faibussowitsch { 3127985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3128d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3129985db425SBarry Smith PetscScalar *x; 3130ce496241SStefano Zampini const MatScalar *aa, *av; 3131985db425SBarry Smith 3132985db425SBarry Smith PetscFunctionBegin; 313328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3135ce496241SStefano Zampini aa = av; 3136985db425SBarry Smith ai = a->i; 3137985db425SBarry Smith aj = a->j; 3138985db425SBarry Smith 31399566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31409566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31419566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 314208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3143985db425SBarry Smith for (i = 0; i < m; i++) { 31449371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31459371c9d4SSatish Balay ai++; 3146d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31479371c9d4SSatish Balay x[i] = *aa; 31489371c9d4SSatish Balay if (idx) idx[i] = 0; 3149985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3150985db425SBarry Smith x[i] = 0.0; 3151985db425SBarry Smith if (idx) { 3152985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3153985db425SBarry Smith if (aj[j] > j) { 3154985db425SBarry Smith idx[i] = j; 3155985db425SBarry Smith break; 3156985db425SBarry Smith } 3157985db425SBarry Smith } 31581a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31591a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3160985db425SBarry Smith } 3161985db425SBarry Smith } 3162985db425SBarry Smith for (j = 0; j < ncols; j++) { 31639371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31649371c9d4SSatish Balay x[i] = *aa; 31659371c9d4SSatish Balay if (idx) idx[i] = *aj; 31669371c9d4SSatish Balay } 31679371c9d4SSatish Balay aa++; 31689371c9d4SSatish Balay aj++; 3169985db425SBarry Smith } 3170985db425SBarry Smith } 31719566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3173985db425SBarry Smith PetscFunctionReturn(0); 3174985db425SBarry Smith } 3175985db425SBarry Smith 3176d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3177d71ae5a4SJacob Faibussowitsch { 3178c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3179c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3180ce496241SStefano Zampini PetscScalar *x; 3181ce496241SStefano Zampini const MatScalar *aa, *av; 3182c87e5d42SMatthew Knepley 3183c87e5d42SMatthew Knepley PetscFunctionBegin; 31849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3185ce496241SStefano Zampini aa = av; 3186c87e5d42SMatthew Knepley ai = a->i; 3187c87e5d42SMatthew Knepley aj = a->j; 3188c87e5d42SMatthew Knepley 31899566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31909566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31919566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 319208401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3193c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31949371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31959371c9d4SSatish Balay ai++; 3196f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 31979371c9d4SSatish Balay x[i] = *aa; 31989371c9d4SSatish Balay if (idx) idx[i] = 0; 3199f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3200f07e67edSHong Zhang x[i] = 0.0; 3201f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3202289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3203f07e67edSHong Zhang if (aj[j] > j) { 3204f07e67edSHong Zhang idx[i] = j; 32052205254eSKarl Rupp break; 32062205254eSKarl Rupp } 3207289a08f5SMatthew Knepley } 3208f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3209f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3210f07e67edSHong Zhang } 3211289a08f5SMatthew Knepley } 3212c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32139371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32149371c9d4SSatish Balay x[i] = *aa; 32159371c9d4SSatish Balay if (idx) idx[i] = *aj; 32169371c9d4SSatish Balay } 32179371c9d4SSatish Balay aa++; 32189371c9d4SSatish Balay aj++; 3219c87e5d42SMatthew Knepley } 3220c87e5d42SMatthew Knepley } 32219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3223c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3224c87e5d42SMatthew Knepley } 3225c87e5d42SMatthew Knepley 3226d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3227d71ae5a4SJacob 
Faibussowitsch { 3228985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3229d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3230d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3231985db425SBarry Smith PetscScalar *x; 3232ce496241SStefano Zampini const MatScalar *aa, *av; 3233985db425SBarry Smith 3234985db425SBarry Smith PetscFunctionBegin; 323528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3237ce496241SStefano Zampini aa = av; 3238985db425SBarry Smith ai = a->i; 3239985db425SBarry Smith aj = a->j; 3240985db425SBarry Smith 32419566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32429566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32439566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 324408401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3245985db425SBarry Smith for (i = 0; i < m; i++) { 32469371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32479371c9d4SSatish Balay ai++; 3248d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32499371c9d4SSatish Balay x[i] = *aa; 32509371c9d4SSatish Balay if (idx) idx[i] = 0; 3251985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3252985db425SBarry Smith x[i] = 0.0; 3253985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3254985db425SBarry Smith for (j = 0; j < ncols; j++) { 3255985db425SBarry Smith if (aj[j] > j) { 3256985db425SBarry Smith idx[i] = j; 3257985db425SBarry Smith break; 3258985db425SBarry Smith } 3259985db425SBarry Smith } 3260fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3261fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3262985db425SBarry Smith } 3263985db425SBarry Smith } 3264985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32659371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32669371c9d4SSatish Balay x[i] = *aa; 32679371c9d4SSatish Balay if (idx) idx[i] = *aj; 32689371c9d4SSatish Balay } 32699371c9d4SSatish Balay aa++; 32709371c9d4SSatish Balay aj++; 3271e34fafa9SBarry Smith } 3272e34fafa9SBarry Smith } 32739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3275e34fafa9SBarry Smith PetscFunctionReturn(0); 3276e34fafa9SBarry Smith } 3277bbead8a2SBarry Smith 3278d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3279d71ae5a4SJacob Faibussowitsch { 3280bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 328133d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3282bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32830da83c2eSBarry Smith const PetscReal shift = 0.0; 32841a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3285bbead8a2SBarry Smith 3286bbead8a2SBarry Smith PetscFunctionBegin; 3287a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32884a0d0026SBarry Smith if (a->ibdiagvalid) { 32894a0d0026SBarry Smith if (values) *values = a->ibdiag; 32904a0d0026SBarry Smith PetscFunctionReturn(0); 32914a0d0026SBarry Smith } 32929566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 32934dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3294bbead8a2SBarry Smith diag = a->ibdiag; 3295bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3296bbead8a2SBarry Smith /* factor and invert each block */ 3297bbead8a2SBarry Smith switch (bs) { 3298bbead8a2SBarry Smith case 1: 3299bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33009566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3301ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3302ec1892c8SHong Zhang if (allowzeropivot) { 33037b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33047b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33057b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33069566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 330798921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3308ec1892c8SHong Zhang } 3309bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3310bbead8a2SBarry Smith } 3311bbead8a2SBarry Smith break; 3312bbead8a2SBarry Smith case 2: 3313bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33149371c9d4SSatish Balay ij[0] = 2 * i; 33159371c9d4SSatish Balay ij[1] = 2 * i + 1; 33169566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33179566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33187b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33199566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3320bbead8a2SBarry Smith diag += 4; 3321bbead8a2SBarry Smith } 3322bbead8a2SBarry Smith break; 3323bbead8a2SBarry Smith case 3: 3324bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33259371c9d4SSatish Balay ij[0] = 3 * i; 33269371c9d4SSatish Balay ij[1] = 3 * i + 1; 33279371c9d4SSatish Balay ij[2] = 3 * i + 2; 33289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33307b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3332bbead8a2SBarry Smith diag += 9; 3333bbead8a2SBarry Smith } 3334bbead8a2SBarry Smith break; 3335bbead8a2SBarry Smith case 4: 3336bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33379371c9d4SSatish Balay ij[0] = 4 * i; 33389371c9d4SSatish Balay ij[1] = 4 * i + 1; 33399371c9d4SSatish Balay ij[2] = 4 * i + 2; 33409371c9d4SSatish Balay ij[3] = 4 * i + 3; 33419566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33437b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3345bbead8a2SBarry Smith diag += 16; 3346bbead8a2SBarry Smith } 3347bbead8a2SBarry Smith break; 3348bbead8a2SBarry Smith case 5: 3349bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33509371c9d4SSatish Balay ij[0] = 5 * i; 33519371c9d4SSatish Balay ij[1] = 5 * i + 1; 33529371c9d4SSatish Balay ij[2] = 5 * i + 2; 33539371c9d4SSatish Balay ij[3] = 5 * i + 3; 33549371c9d4SSatish Balay ij[4] = 5 * i + 4; 33559566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33577b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3359bbead8a2SBarry Smith diag += 25; 3360bbead8a2SBarry Smith } 3361bbead8a2SBarry Smith break; 3362bbead8a2SBarry Smith case 6: 3363bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33649371c9d4SSatish Balay ij[0] = 6 * i; 33659371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33669371c9d4SSatish Balay ij[2] = 6 * i + 2; 33679371c9d4SSatish Balay ij[3] = 6 * i + 3; 33689371c9d4SSatish Balay ij[4] = 6 * i + 4; 33699371c9d4SSatish Balay ij[5] = 6 * i + 5; 33709566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33727b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3374bbead8a2SBarry Smith diag += 36; 3375bbead8a2SBarry Smith } 3376bbead8a2SBarry Smith break; 3377bbead8a2SBarry Smith case 7: 3378bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33799371c9d4SSatish Balay ij[0] = 7 * i; 33809371c9d4SSatish Balay ij[1] = 7 * i + 1; 33819371c9d4SSatish Balay ij[2] = 7 * i + 2; 33829371c9d4SSatish Balay ij[3] = 7 * i + 3; 33839371c9d4SSatish Balay ij[4] = 7 * i + 4; 33849371c9d4SSatish Balay ij[5] = 7 * i + 5; 33859371c9d4SSatish Balay ij[6] = 7 * i + 6; /* seventh row/column index of the block: must go in ij[6]; storing it in ij[5] left ij[6] unset for the 7-index MatGetValues() call below */ 33869566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33887b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33899566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3390bbead8a2SBarry Smith diag += 49; 3391bbead8a2SBarry Smith } 3392bbead8a2SBarry Smith break; 3393bbead8a2SBarry Smith default: 33949566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3395bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3396ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 33979566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 33989566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots,
v_work, allowzeropivot, &zeropivotdetected)); 33997b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34009566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3401bbead8a2SBarry Smith diag += bs2; 3402bbead8a2SBarry Smith } 34039566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3404bbead8a2SBarry Smith } 3405bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3406bbead8a2SBarry Smith PetscFunctionReturn(0); 3407bbead8a2SBarry Smith } 3408bbead8a2SBarry Smith 3409d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3410d71ae5a4SJacob Faibussowitsch { 341173a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3412fff043a9SJunchao Zhang PetscScalar a, *aa; 341373a71a0fSBarry Smith PetscInt m, n, i, j, col; 341473a71a0fSBarry Smith 341573a71a0fSBarry Smith PetscFunctionBegin; 341673a71a0fSBarry Smith if (!x->assembled) { 34179566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 341873a71a0fSBarry Smith for (i = 0; i < m; i++) { 341973a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34209566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 342173a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34229566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 342373a71a0fSBarry Smith } 342473a71a0fSBarry Smith } 3425e2ce353bSJunchao Zhang } else { 34269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34279566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3429e2ce353bSJunchao Zhang } 34309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 343273a71a0fSBarry Smith PetscFunctionReturn(0); 
343373a71a0fSBarry Smith } 343473a71a0fSBarry Smith 3435679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3436d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3437d71ae5a4SJacob Faibussowitsch { 3438679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3439679944adSJunchao Zhang PetscScalar a; 3440679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3441679944adSJunchao Zhang 3442679944adSJunchao Zhang PetscFunctionBegin; 3443679944adSJunchao Zhang nskip = high - low; 34449566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3445679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3446679944adSJunchao Zhang for (i = 0; i < m; i++) { 3447679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34489566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3449679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3450679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34519566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3452679944adSJunchao Zhang } 3453e2ce353bSJunchao Zhang } 34549566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 3456679944adSJunchao Zhang PetscFunctionReturn(0); 3457679944adSJunchao Zhang } 3458679944adSJunchao Zhang 3459682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34600a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3461cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3462cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3463cb5b572fSBarry Smith MatMult_SeqAIJ, 346497304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34657c922b88SBarry Smith 
MatMultTranspose_SeqAIJ, 34667c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3467f4259b30SLisandro Dalcin NULL, 3468f4259b30SLisandro Dalcin NULL, 3469f4259b30SLisandro Dalcin NULL, 3470f4259b30SLisandro Dalcin /* 10*/ NULL, 3471cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3472f4259b30SLisandro Dalcin NULL, 347341f059aeSBarry Smith MatSOR_SeqAIJ, 347491e9d3e2SHong Zhang MatTranspose_SeqAIJ, 347597304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3476cb5b572fSBarry Smith MatEqual_SeqAIJ, 3477cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3478cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3479cb5b572fSBarry Smith MatNorm_SeqAIJ, 3480f4259b30SLisandro Dalcin /* 20*/ NULL, 3481cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3482cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3483cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3484d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3485f4259b30SLisandro Dalcin NULL, 3486f4259b30SLisandro Dalcin NULL, 3487f4259b30SLisandro Dalcin NULL, 3488f4259b30SLisandro Dalcin NULL, 34894994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3490f4259b30SLisandro Dalcin NULL, 3491f4259b30SLisandro Dalcin NULL, 3492f4259b30SLisandro Dalcin NULL, 3493f4259b30SLisandro Dalcin NULL, 3494d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin NULL, 3497cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3498f4259b30SLisandro Dalcin NULL, 3499d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35007dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3501cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3502cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3503cb5b572fSBarry Smith MatCopy_SeqAIJ, 3504d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3505cb5b572fSBarry Smith MatScale_SeqAIJ, 35067d68702bSBarry Smith MatShift_SeqAIJ, 350779299369SBarry Smith MatDiagonalSet_SeqAIJ, 35086e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 350973a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35103b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 
35113b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35123b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3513a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 351493dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3515f4259b30SLisandro Dalcin NULL, 3516f4259b30SLisandro Dalcin NULL, 3517cda55fadSBarry Smith MatPermute_SeqAIJ, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin /* 59*/ NULL, 3520b9b97703SBarry Smith MatDestroy_SeqAIJ, 3521b9b97703SBarry Smith MatView_SeqAIJ, 3522f4259b30SLisandro Dalcin NULL, 3523f4259b30SLisandro Dalcin NULL, 3524f4259b30SLisandro Dalcin /* 64*/ NULL, 3525321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3526f4259b30SLisandro Dalcin NULL, 3527f4259b30SLisandro Dalcin NULL, 3528f4259b30SLisandro Dalcin NULL, 3529d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3530c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3531f4259b30SLisandro Dalcin NULL, 3532f4259b30SLisandro Dalcin NULL, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin /* 74*/ NULL, 35353acb8795SBarry Smith MatFDColoringApply_AIJ, 3536f4259b30SLisandro Dalcin NULL, 3537f4259b30SLisandro Dalcin NULL, 3538f4259b30SLisandro Dalcin NULL, 35396ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin NULL, 3542f4259b30SLisandro Dalcin NULL, 3543bc011b1eSHong Zhang MatLoad_SeqAIJ, 3544d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35451cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3546f4259b30SLisandro Dalcin NULL, 3547f4259b30SLisandro Dalcin NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin /* 89*/ NULL, 3550f4259b30SLisandro Dalcin NULL, 355126be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3552f4259b30SLisandro Dalcin NULL, 3553f4259b30SLisandro Dalcin NULL, 35548fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin NULL, 35576fc122caSHong Zhang 
MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3558f4259b30SLisandro Dalcin NULL, 35594222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin NULL, 356287d4246cSBarry Smith MatConjugate_SeqAIJ, 3563f4259b30SLisandro Dalcin NULL, 3564d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 356599cafbc1SBarry Smith MatRealPart_SeqAIJ, 3566f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 3569cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3570f4259b30SLisandro Dalcin NULL, 35712af78befSBarry Smith MatGetRowMin_SeqAIJ, 3572f4259b30SLisandro Dalcin NULL, 3573599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3574f4259b30SLisandro Dalcin /*114*/ NULL, 3575f4259b30SLisandro Dalcin NULL, 3576f4259b30SLisandro Dalcin NULL, 3577f4259b30SLisandro Dalcin NULL, 3578f4259b30SLisandro Dalcin NULL, 3579f4259b30SLisandro Dalcin /*119*/ NULL, 3580f4259b30SLisandro Dalcin NULL, 3581f4259b30SLisandro Dalcin NULL, 3582f4259b30SLisandro Dalcin NULL, 3583b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35840716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3585a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 358637868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35870da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin /*129*/ NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin NULL, 359275648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3593b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3594b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 35952b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3596f4259b30SLisandro Dalcin NULL, 3597f4259b30SLisandro Dalcin NULL, 35983964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3599f4259b30SLisandro Dalcin /*139*/ NULL, 3600f4259b30SLisandro Dalcin NULL, 3601f4259b30SLisandro Dalcin 
NULL, 36023a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36039c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36044222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36054222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3606f4259b30SLisandro Dalcin NULL, 360772833a62Smarkadams4 NULL, 360872833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36092d776b49SBarry Smith NULL, 36109371c9d4SSatish Balay /*150*/ MatTransposeSymbolic_SeqAIJ}; 361117ab2063SBarry Smith 3612d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3613d71ae5a4SJacob Faibussowitsch { 3614bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 361597f1f81fSBarry Smith PetscInt i, nz, n; 3616bef8e0ddSBarry Smith 3617bef8e0ddSBarry Smith PetscFunctionBegin; 3618bef8e0ddSBarry Smith nz = aij->maxnz; 3619d0f46423SBarry Smith n = mat->rmap->n; 3620ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3621bef8e0ddSBarry Smith aij->nz = nz; 3622ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 3623bef8e0ddSBarry Smith PetscFunctionReturn(0); 3624bef8e0ddSBarry Smith } 3625bef8e0ddSBarry Smith 3626a3bb6f32SFande Kong /* 3627ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3628ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3629ddea5d60SJunchao Zhang */ 3630d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3631d71ae5a4SJacob Faibussowitsch { 3632a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3633a3bb6f32SFande Kong PetscTable gid1_lid1; 3634a3bb6f32SFande Kong PetscTablePosition tpos; 363525b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 363625b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3637a3bb6f32SFande Kong 3638a3bb6f32SFande Kong PetscFunctionBegin; 3639a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3640a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3641a3bb6f32SFande Kong /* use a table */ 36429566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n, mat->cmap->N + 1, &gid1_lid1)); 3643a3bb6f32SFande Kong ec = 0; 364425b670f0SStefano Zampini for (i = 0; i < nz; i++) { 364525b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 36469566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &data)); 3647a3bb6f32SFande Kong if (!data) { 3648a3bb6f32SFande Kong /* one based table */ 36499566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1, gid1, ++ec, INSERT_VALUES)); 3650a3bb6f32SFande Kong } 3651a3bb6f32SFande Kong } 3652a3bb6f32SFande Kong /* form array of columns we need */ 36539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 36549566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1, &tpos)); 3655a3bb6f32SFande Kong while (tpos) { 36569566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1, &tpos, &gid, &lid)); 3657a3bb6f32SFande Kong gid--; 3658a3bb6f32SFande Kong lid--; 3659a3bb6f32SFande Kong garray[lid] = gid; 3660a3bb6f32SFande Kong } 36619566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* 
sort, and rebuild */ 36629566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 366348a46eb9SPierre Jolivet for (i = 0; i < ec; i++) PetscCall(PetscTableAdd(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES)); 3664a3bb6f32SFande Kong /* compact out the extra columns in B */ 366525b670f0SStefano Zampini for (i = 0; i < nz; i++) { 366625b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36679566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &lid)); 3668a3bb6f32SFande Kong lid--; 366925b670f0SStefano Zampini jj[i] = lid; 3670a3bb6f32SFande Kong } 36719566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36729566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36739566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36749566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36759566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3676a3bb6f32SFande Kong PetscFunctionReturn(0); 3677a3bb6f32SFande Kong } 3678a3bb6f32SFande Kong 3679bef8e0ddSBarry Smith /*@ 3680bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3681bef8e0ddSBarry Smith in the matrix. 3682bef8e0ddSBarry Smith 3683bef8e0ddSBarry Smith Input Parameters: 368411a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3685bef8e0ddSBarry Smith - indices - the column indices 3686bef8e0ddSBarry Smith 368715091d37SBarry Smith Level: advanced 368815091d37SBarry Smith 3689bef8e0ddSBarry Smith Notes: 3690bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3691bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 369211a5261eSBarry Smith of the `MatSetValues()` operation. 
3693bef8e0ddSBarry Smith 3694bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 369511a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3696bef8e0ddSBarry Smith 369711a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3698bef8e0ddSBarry Smith 3699b9617806SBarry Smith The indices should start with zero, not one. 3700b9617806SBarry Smith 3701bef8e0ddSBarry Smith @*/ 3702d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3703d71ae5a4SJacob Faibussowitsch { 3704bef8e0ddSBarry Smith PetscFunctionBegin; 37050700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3706dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3707cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3708bef8e0ddSBarry Smith PetscFunctionReturn(0); 3709bef8e0ddSBarry Smith } 3710bef8e0ddSBarry Smith 3711be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3712be6bf707SBarry Smith 3713d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3714d71ae5a4SJacob Faibussowitsch { 3715be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3716d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3717be6bf707SBarry Smith 3718be6bf707SBarry Smith PetscFunctionBegin; 371928b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3720be6bf707SBarry Smith 3721be6bf707SBarry Smith /* allocate space for values if not already there */ 37224dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3723be6bf707SBarry Smith 3724be6bf707SBarry Smith /* copy values over */ 37259566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, 
nz)); 3726be6bf707SBarry Smith PetscFunctionReturn(0); 3727be6bf707SBarry Smith } 3728be6bf707SBarry Smith 3729be6bf707SBarry Smith /*@ 3730be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3731be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3732be6bf707SBarry Smith nonlinear portion. 3733be6bf707SBarry Smith 3734c3339decSBarry Smith Logically Collect 3735be6bf707SBarry Smith 3736be6bf707SBarry Smith Input Parameters: 373711a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3738be6bf707SBarry Smith 373915091d37SBarry Smith Level: advanced 374015091d37SBarry Smith 374111a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3742be6bf707SBarry Smith $ Create Jacobian matrix 3743be6bf707SBarry Smith $ Set linear terms into matrix 3744be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3745be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3746be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3747512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3748be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3749be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3750be6bf707SBarry Smith $ In your Jacobian routine 3751be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3752be6bf707SBarry Smith $ Set nonlinear terms in matrix 3753be6bf707SBarry Smith 3754be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. 
when you handle nonlinear solve yourself: 3755be6bf707SBarry Smith $ // build linear portion of Jacobian 3756512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3757be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3758be6bf707SBarry Smith $ loop over nonlinear iterations 3759be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3760be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3761be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3762be6bf707SBarry Smith $ Solve linear system with Jacobian 3763be6bf707SBarry Smith $ endloop 3764be6bf707SBarry Smith 3765be6bf707SBarry Smith Notes: 3766be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 376711a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3768be6bf707SBarry Smith calling this routine. 3769be6bf707SBarry Smith 37700c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37710c468ba9SBarry Smith and does not allocated additional space. 
37720c468ba9SBarry Smith 3773db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3774be6bf707SBarry Smith @*/ 3775d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3776d71ae5a4SJacob Faibussowitsch { 3777be6bf707SBarry Smith PetscFunctionBegin; 37780700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 377928b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 378028b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3781cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3782be6bf707SBarry Smith PetscFunctionReturn(0); 3783be6bf707SBarry Smith } 3784be6bf707SBarry Smith 3785d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3786d71ae5a4SJacob Faibussowitsch { 3787be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3788d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3789be6bf707SBarry Smith 3790be6bf707SBarry Smith PetscFunctionBegin; 379128b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 379228b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3793be6bf707SBarry Smith /* copy values over */ 37949566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3795be6bf707SBarry Smith PetscFunctionReturn(0); 3796be6bf707SBarry Smith } 3797be6bf707SBarry Smith 3798be6bf707SBarry Smith /*@ 3799be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3800be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3801be6bf707SBarry Smith nonlinear portion. 
3802be6bf707SBarry Smith 3803c3339decSBarry Smith Logically Collect 3804be6bf707SBarry Smith 3805be6bf707SBarry Smith Input Parameters: 380611a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3807be6bf707SBarry Smith 380815091d37SBarry Smith Level: advanced 380915091d37SBarry Smith 3810db781477SPatrick Sanan .seealso: `MatStoreValues()` 3811be6bf707SBarry Smith @*/ 3812d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3813d71ae5a4SJacob Faibussowitsch { 3814be6bf707SBarry Smith PetscFunctionBegin; 38150700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 381628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 381728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3818cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 3819be6bf707SBarry Smith PetscFunctionReturn(0); 3820be6bf707SBarry Smith } 3821be6bf707SBarry Smith 3822be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 382317ab2063SBarry Smith /*@C 382411a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38250d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38266e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 382751c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38282bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 382917ab2063SBarry Smith 3830d083f849SBarry Smith Collective 3831db81eaa0SLois Curfman McInnes 383217ab2063SBarry Smith Input Parameters: 383311a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 383417ab2063SBarry Smith . 
m - number of rows 383517ab2063SBarry Smith . n - number of columns 383617ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 383751c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38380298fd71SBarry Smith (possibly different for each row) or NULL 383917ab2063SBarry Smith 384017ab2063SBarry Smith Output Parameter: 3841416022c9SBarry Smith . A - the matrix 384217ab2063SBarry Smith 384311a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3844f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 384511a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3846175b88e8SBarry Smith 3847b259b22eSLois Curfman McInnes Notes: 384849a6f317SBarry Smith If nnz is given then nz is ignored 384949a6f317SBarry Smith 385011a5261eSBarry Smith The AIJ format, also called 385111a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38520002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 385344cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 385417ab2063SBarry Smith 385517ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 385611a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38573d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38586da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 385917ab2063SBarry Smith 3860682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38614fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3862682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38636c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38646c7ebb05SLois Curfman McInnes 38656c7ebb05SLois Curfman McInnes Options Database Keys: 3866698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38679db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 386817ab2063SBarry Smith 3869027ccd11SLois Curfman McInnes Level: intermediate 3870027ccd11SLois Curfman McInnes 387160161072SBarry Smith .seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 387217ab2063SBarry Smith @*/ 3873d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3874d71ae5a4SJacob Faibussowitsch { 38753a40ed3dSBarry Smith PetscFunctionBegin; 38769566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38779566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38789566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 3880273d9f13SBarry Smith PetscFunctionReturn(0); 3881273d9f13SBarry Smith } 3882273d9f13SBarry Smith 3883273d9f13SBarry Smith /*@C 3884273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3885273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3886273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3887273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 
3888273d9f13SBarry Smith 3889d083f849SBarry Smith Collective 3890273d9f13SBarry Smith 3891273d9f13SBarry Smith Input Parameters: 38921c4f3114SJed Brown + B - The matrix 3893273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3894273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38950298fd71SBarry Smith (possibly different for each row) or NULL 3896273d9f13SBarry Smith 3897273d9f13SBarry Smith Notes: 389849a6f317SBarry Smith If nnz is given then nz is ignored 389949a6f317SBarry Smith 390011a5261eSBarry Smith The `MATSEQAIJ` format also called 390111a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 3902273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3903273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3904273d9f13SBarry Smith 3905273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 390611a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 3907273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3908273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3909273d9f13SBarry Smith 391011a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3911aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3912aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3913aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3914aa95bbe8SBarry Smith 391511a5261eSBarry Smith Developer Notes: 391611a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3917a96a251dSBarry Smith entries or columns indices 3918a96a251dSBarry Smith 3919273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3920273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3921273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3922273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3923273d9f13SBarry Smith 3924273d9f13SBarry Smith Options Database Keys: 3925698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 392647b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3927273d9f13SBarry Smith 3928273d9f13SBarry Smith Level: intermediate 3929273d9f13SBarry Smith 3930db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3931db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3932273d9f13SBarry Smith @*/ 3933d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3934d71ae5a4SJacob Faibussowitsch { 3935a23d5eceSKris Buschelman PetscFunctionBegin; 39366ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39376ba663aaSJed Brown PetscValidType(B, 1); 3938cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3939a23d5eceSKris Buschelman PetscFunctionReturn(0); 3940a23d5eceSKris Buschelman } 3941a23d5eceSKris Buschelman 3942d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3943d71ae5a4SJacob Faibussowitsch { 3944273d9f13SBarry Smith Mat_SeqAIJ *b; 39452576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 394697f1f81fSBarry Smith PetscInt i; 3947273d9f13SBarry Smith 3948273d9f13SBarry Smith PetscFunctionBegin; 39492576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3950a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3951c461c341SBarry Smith skipallocation = PETSC_TRUE; 3952c461c341SBarry Smith nz = 0; 3953c461c341SBarry Smith } 39549566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39559566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3956899cda47SBarry Smith 3957435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 395808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3959cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3960d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 396108401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 396208401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3963b73539f3SBarry Smith } 3964b73539f3SBarry Smith } 3965b73539f3SBarry Smith 3966273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39672205254eSKarl Rupp 3968273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3969273d9f13SBarry Smith 3970ab93d7beSBarry Smith if (!skipallocation) { 39714dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3972071fcb05SBarry Smith if (!b->ilen) { 3973071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39749566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3975071fcb05SBarry Smith } else { 39769566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39772ee49352SLisandro Dalcin } 39784dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3979273d9f13SBarry Smith if (!nnz) { 3980435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3981c62bd62aSJed Brown else if (nz < 0) nz = 1; 39825d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3983d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3984d0f46423SBarry Smith nz = nz * B->rmap->n; 3985273d9f13SBarry Smith } else { 3986c73702f5SBarry Smith PetscInt64 nz64 = 0; 39879371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39889371c9d4SSatish Balay b->imax[i] = nnz[i]; 39899371c9d4SSatish Balay nz64 += nnz[i]; 39909371c9d4SSatish Balay } 39919566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3992273d9f13SBarry Smith } 3993ab93d7beSBarry Smith 3994273d9f13SBarry Smith /* allocate the matrix space */ 399553dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39969566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 3997396832f4SHong Zhang if (B->structure_only) { 39989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 39999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4000396832f4SHong Zhang } else { 40019566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4002396832f4SHong Zhang } 4003bfeeae90SHong Zhang b->i[0] = 0; 4004ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4005396832f4SHong Zhang if (B->structure_only) { 4006396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4007396832f4SHong Zhang b->free_a = PETSC_FALSE; 4008396832f4SHong Zhang } else { 4009273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4010e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4011396832f4SHong Zhang } 4012e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4013c461c341SBarry Smith } else { 4014e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4015e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4016c461c341SBarry Smith } 4017273d9f13SBarry Smith 4018846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4019846b4da1SFande Kong /* reserve user-requested sparsity */ 40209566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4021846b4da1SFande Kong } 4022846b4da1SFande Kong 4023273d9f13SBarry Smith b->nz = 0; 4024273d9f13SBarry Smith b->maxnz = nz; 4025273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40261baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4027cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4028cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40295519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40305519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40315519a089SJose E. Roman */ 40325519a089SJose E. Roman B->nonzerostate++; 4033273d9f13SBarry Smith PetscFunctionReturn(0); 4034273d9f13SBarry Smith } 4035273d9f13SBarry Smith 4036d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4037d71ae5a4SJacob Faibussowitsch { 4038846b4da1SFande Kong Mat_SeqAIJ *a; 4039a5bbaf83SFande Kong PetscInt i; 4040846b4da1SFande Kong 4041846b4da1SFande Kong PetscFunctionBegin; 4042846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 404314d0e64fSAlex Lindsay 404414d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 404514d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 404614d0e64fSAlex Lindsay 4047846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40482c814fdeSFande Kong /* if no saved info, we error out */ 404928b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40502c814fdeSFande Kong 4051aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40522c814fdeSFande Kong 40539566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40549566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4055846b4da1SFande Kong a->i[0] = 0; 4056ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4057846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4058846b4da1SFande Kong a->nz = 0; 4059846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4060846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4061846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4062846b4da1SFande Kong A->assembled = PETSC_FALSE; 4063846b4da1SFande Kong PetscFunctionReturn(0); 4064846b4da1SFande Kong } 4065846b4da1SFande Kong 406658d36128SBarry Smith /*@ 406711a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
   sparse sequential matrix in `MATSEQAIJ` format.

   Input Parameters:
+  B - the matrix
.  i - the indices into j for the start of each row (starts with zero)
.  j - the column indices for each row (starts with zero); these must be sorted for each row
-  v - optional values in the matrix

   Level: developer

   Notes:
   The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`

   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
   structure will be the union of all the previous nonzero structures.

   Developer Notes:
   An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and
   then just copies the v values directly with `PetscMemcpy()`.

   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40886a9b8d82SBarry Smith 4089db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4090a1661176SMatthew Knepley @*/ 4091d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4092d71ae5a4SJacob Faibussowitsch { 4093a1661176SMatthew Knepley PetscFunctionBegin; 40940700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 40956ba663aaSJed Brown PetscValidType(B, 1); 4096cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4097a1661176SMatthew Knepley PetscFunctionReturn(0); 4098a1661176SMatthew Knepley } 4099a1661176SMatthew Knepley 4100d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4101d71ae5a4SJacob Faibussowitsch { 4102a1661176SMatthew Knepley PetscInt i; 4103a1661176SMatthew Knepley PetscInt m, n; 4104a1661176SMatthew Knepley PetscInt nz; 41056a9b8d82SBarry Smith PetscInt *nnz; 4106a1661176SMatthew Knepley 4107a1661176SMatthew Knepley PetscFunctionBegin; 4108aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4109779a8d59SSatish Balay 41109566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41119566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4112779a8d59SSatish Balay 41139566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4115a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4116b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 411708401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4118a1661176SMatthew Knepley nnz[i] = nz; 4119a1661176SMatthew Knepley } 41209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41219566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4122a1661176SMatthew Knepley 412348a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4124a1661176SMatthew Knepley 41259566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41269566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4127a1661176SMatthew Knepley 41289566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4129a1661176SMatthew Knepley PetscFunctionReturn(0); 4130a1661176SMatthew Knepley } 4131a1661176SMatthew Knepley 4132ad7e164aSPierre Jolivet /*@ 4133ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4134ad7e164aSPierre Jolivet 4135ad7e164aSPierre Jolivet Input Parameters: 4136ad7e164aSPierre Jolivet + A - left-hand side matrix 4137ad7e164aSPierre Jolivet . B - right-hand side matrix 413811a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4139ad7e164aSPierre Jolivet 4140ad7e164aSPierre Jolivet Output Parameter: 4141ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4142ad7e164aSPierre Jolivet 4143ad7e164aSPierre Jolivet Level: intermediate 4144ad7e164aSPierre Jolivet 414511a5261eSBarry Smith Note: 414611a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4147ad7e164aSPierre Jolivet 4148db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4149ad7e164aSPierre Jolivet @*/ 4150d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4151d71ae5a4SJacob Faibussowitsch { 4152ad7e164aSPierre Jolivet PetscFunctionBegin; 4153ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4154ad7e164aSPierre Jolivet PetscValidType(A, 1); 4155ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4156ad7e164aSPierre Jolivet PetscValidType(B, 2); 4157ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4158ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4159ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4160ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4161ad7e164aSPierre Jolivet } 4162cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4163ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4164ad7e164aSPierre Jolivet } 4165ad7e164aSPierre Jolivet 4166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4167d71ae5a4SJacob Faibussowitsch { 4168ad7e164aSPierre Jolivet Mat newmat; 4169ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4170ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4171ad7e164aSPierre Jolivet PetscScalar *v; 4172fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4173ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4174ad7e164aSPierre Jolivet PetscBool flg; 4175ad7e164aSPierre Jolivet 4176ad7e164aSPierre Jolivet PetscFunctionBegin; 417728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 417828b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 417928b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418028b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41819566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 418228b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4183aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4184ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41859566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41869566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41879566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41889566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4189ad7e164aSPierre Jolivet i[0] = 0; 4190ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4191ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4192ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4193ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4194ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4195ad7e164aSPierre Jolivet } 4196ad7e164aSPierre Jolivet } 4197ad7e164aSPierre Jolivet } 41989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4199ad7e164aSPierre Jolivet *C = newmat; 42009566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4201ad7e164aSPierre Jolivet nnz = 0; 4202ad7e164aSPierre Jolivet } 42039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 42049566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4206ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4207ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4208ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4209ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4210ad7e164aSPierre Jolivet } 4211ad7e164aSPierre Jolivet } 4212ad7e164aSPierre Jolivet } 42139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4216ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4217ad7e164aSPierre Jolivet } 4218ad7e164aSPierre Jolivet 4219c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4220af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4221170fe5c8SBarry Smith 4222170fe5c8SBarry Smith /* 4223170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4224170fe5c8SBarry Smith 4225170fe5c8SBarry Smith n p p 42262da392ccSBarry Smith [ ] [ ] [ ] 42272da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42282da392ccSBarry Smith [ ] [ ] [ ] 4229170fe5c8SBarry Smith 4230170fe5c8SBarry Smith */ 4231d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4232d71ae5a4SJacob Faibussowitsch { 4233170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4234170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4235170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 423686214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4237170fe5c8SBarry Smith const PetscInt *ii, *idx; 4238170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4239170fe5c8SBarry Smith PetscScalar *c, *c_q; 424086214ceeSStefano Zampini PetscInt clda = sub_c->lda; 424186214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4242170fe5c8SBarry Smith 4243170fe5c8SBarry Smith PetscFunctionBegin; 4244d0f46423SBarry Smith m = A->rmap->n; 4245d0f46423SBarry Smith n = A->cmap->n; 4246d0f46423SBarry Smith p = B->cmap->n; 4247170fe5c8SBarry Smith a = sub_a->v; 4248170fe5c8SBarry Smith b = sub_b->a; 4249170fe5c8SBarry Smith c = sub_c->v; 425086214ceeSStefano Zampini if (clda == m) { 42519566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 425286214ceeSStefano Zampini } else { 425386214ceeSStefano Zampini for (j = 0; j < p; j++) 42549371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 425586214ceeSStefano Zampini } 4256170fe5c8SBarry Smith ii = sub_b->i; 4257170fe5c8SBarry Smith idx = sub_b->j; 4258170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4259170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4260170fe5c8SBarry Smith while (q-- > 0) { 426186214ceeSStefano Zampini c_q = c + clda * (*idx); 426286214ceeSStefano Zampini a_q = a + alda * i; 4263854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4264170fe5c8SBarry Smith idx++; 4265170fe5c8SBarry Smith b++; 4266170fe5c8SBarry Smith } 4267170fe5c8SBarry Smith } 4268170fe5c8SBarry Smith PetscFunctionReturn(0); 4269170fe5c8SBarry Smith } 4270170fe5c8SBarry Smith 4271d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4272d71ae5a4SJacob Faibussowitsch { 4273d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 427486214ceeSStefano Zampini PetscBool cisdense; 4275170fe5c8SBarry Smith 4276170fe5c8SBarry Smith PetscFunctionBegin; 427708401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42789566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42799566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 42809566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 428148a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42829566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4283d73949e8SHong Zhang 42844222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4285170fe5c8SBarry Smith PetscFunctionReturn(0); 4286170fe5c8SBarry Smith } 4287170fe5c8SBarry Smith 4288170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42890bad9183SKris Buschelman /*MC 4290fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42910bad9183SKris Buschelman based on compressed sparse row format. 42920bad9183SKris Buschelman 42930bad9183SKris Buschelman Options Database Keys: 42940bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 42950bad9183SKris Buschelman 42960bad9183SKris Buschelman Level: beginner 42970bad9183SKris Buschelman 42980cd7f59aSBarry Smith Notes: 429911a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 43000cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43010cd7f59aSBarry Smith in the matrix 43020cd7f59aSBarry Smith 430311a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
    In this case no space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

  Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
   enough exist.
4327ccd284c7SBarry Smith 4328ccd284c7SBarry Smith Level: beginner 4329ccd284c7SBarry Smith 4330db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4331ccd284c7SBarry Smith M*/ 4332ccd284c7SBarry Smith 4333ccd284c7SBarry Smith /*MC 4334ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4335ccd284c7SBarry Smith 433611a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 433711a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 433811a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4339ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4340ccd284c7SBarry Smith the above preallocation routines for simplicity. 4341ccd284c7SBarry Smith 4342ccd284c7SBarry Smith Options Database Keys: 434311a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4344ccd284c7SBarry Smith 4345ccd284c7SBarry Smith Level: beginner 4346ccd284c7SBarry Smith 4347c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4348ccd284c7SBarry Smith M*/ 4349ccd284c7SBarry Smith 43507906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43517906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43527906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43537906f579SHong Zhang #endif 4354d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4355d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4356d24d4204SJose E. 
Roman #endif 43577906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43587906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43597906f579SHong Zhang #endif 43607906f579SHong Zhang 4361d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4362c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43634222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43647906f579SHong Zhang 43658c778c55SBarry Smith /*@C 436611a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43678c778c55SBarry Smith 43688c778c55SBarry Smith Not Collective 43698c778c55SBarry Smith 43708c778c55SBarry Smith Input Parameter: 437111a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43728c778c55SBarry Smith 43738c778c55SBarry Smith Output Parameter: 43748c778c55SBarry Smith . 
array - pointer to the data 43758c778c55SBarry Smith 43768c778c55SBarry Smith Level: intermediate 43778c778c55SBarry Smith 4378db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43798c778c55SBarry Smith @*/ 4380d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4381d71ae5a4SJacob Faibussowitsch { 4382d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43838c778c55SBarry Smith 43848c778c55SBarry Smith PetscFunctionBegin; 4385d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43869566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4387d67d9f35SJunchao Zhang } else { 4388d67d9f35SJunchao Zhang *array = aij->a; 4389d67d9f35SJunchao Zhang } 4390d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4391d67d9f35SJunchao Zhang } 4392d67d9f35SJunchao Zhang 4393d67d9f35SJunchao Zhang /*@C 439411a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4395d67d9f35SJunchao Zhang 4396d67d9f35SJunchao Zhang Not Collective 4397d67d9f35SJunchao Zhang 4398d67d9f35SJunchao Zhang Input Parameters: 439911a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4400d67d9f35SJunchao Zhang - array - pointer to the data 4401d67d9f35SJunchao Zhang 4402d67d9f35SJunchao Zhang Level: intermediate 4403d67d9f35SJunchao Zhang 4404db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4405d67d9f35SJunchao Zhang @*/ 4406d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4407d71ae5a4SJacob Faibussowitsch { 4408d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4409d67d9f35SJunchao Zhang 4410d67d9f35SJunchao Zhang PetscFunctionBegin; 4411d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44129566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4413d67d9f35SJunchao Zhang } else { 4414d67d9f35SJunchao 
Zhang *array = NULL; 4415d67d9f35SJunchao Zhang } 44169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44179566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44188c778c55SBarry Smith PetscFunctionReturn(0); 44198c778c55SBarry Smith } 44208c778c55SBarry Smith 442121e72a00SBarry Smith /*@C 442211a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44238f1ea47aSStefano Zampini 44248f1ea47aSStefano Zampini Not Collective 44258f1ea47aSStefano Zampini 44268f1ea47aSStefano Zampini Input Parameter: 442711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44288f1ea47aSStefano Zampini 44298f1ea47aSStefano Zampini Output Parameter: 44308f1ea47aSStefano Zampini . array - pointer to the data 44318f1ea47aSStefano Zampini 44328f1ea47aSStefano Zampini Level: intermediate 44338f1ea47aSStefano Zampini 4434db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44358f1ea47aSStefano Zampini @*/ 4436d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4437d71ae5a4SJacob Faibussowitsch { 4438d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44398f1ea47aSStefano Zampini 44408f1ea47aSStefano Zampini PetscFunctionBegin; 4441d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44429566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4443d67d9f35SJunchao Zhang } else { 4444d67d9f35SJunchao Zhang *array = aij->a; 4445d67d9f35SJunchao Zhang } 44468f1ea47aSStefano Zampini PetscFunctionReturn(0); 44478f1ea47aSStefano Zampini } 44488f1ea47aSStefano Zampini 44498f1ea47aSStefano Zampini /*@C 445011a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44518f1ea47aSStefano Zampini 44528f1ea47aSStefano Zampini Not Collective 44538f1ea47aSStefano Zampini 44548f1ea47aSStefano Zampini Input 
Parameter: 445511a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44568f1ea47aSStefano Zampini 44578f1ea47aSStefano Zampini Output Parameter: 44588f1ea47aSStefano Zampini . array - pointer to the data 44598f1ea47aSStefano Zampini 44608f1ea47aSStefano Zampini Level: intermediate 44618f1ea47aSStefano Zampini 4462db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44638f1ea47aSStefano Zampini @*/ 4464d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4465d71ae5a4SJacob Faibussowitsch { 4466d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44678f1ea47aSStefano Zampini 44688f1ea47aSStefano Zampini PetscFunctionBegin; 4469d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44709566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4471d67d9f35SJunchao Zhang } else { 4472d67d9f35SJunchao Zhang *array = NULL; 4473d67d9f35SJunchao Zhang } 4474d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4475d67d9f35SJunchao Zhang } 4476d67d9f35SJunchao Zhang 4477d67d9f35SJunchao Zhang /*@C 447811a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4479d67d9f35SJunchao Zhang 4480d67d9f35SJunchao Zhang Not Collective 4481d67d9f35SJunchao Zhang 4482d67d9f35SJunchao Zhang Input Parameter: 448311a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4484d67d9f35SJunchao Zhang 4485d67d9f35SJunchao Zhang Output Parameter: 4486d67d9f35SJunchao Zhang . 
array - pointer to the data 4487d67d9f35SJunchao Zhang 4488d67d9f35SJunchao Zhang Level: intermediate 4489d67d9f35SJunchao Zhang 4490db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4491d67d9f35SJunchao Zhang @*/ 4492d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4493d71ae5a4SJacob Faibussowitsch { 4494d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4495d67d9f35SJunchao Zhang 4496d67d9f35SJunchao Zhang PetscFunctionBegin; 4497d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 44989566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4499d67d9f35SJunchao Zhang } else { 4500d67d9f35SJunchao Zhang *array = aij->a; 4501d67d9f35SJunchao Zhang } 45029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45039566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4504d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4505d67d9f35SJunchao Zhang } 4506d67d9f35SJunchao Zhang 4507d67d9f35SJunchao Zhang /*@C 4508d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4509d67d9f35SJunchao Zhang 4510d67d9f35SJunchao Zhang Not Collective 4511d67d9f35SJunchao Zhang 4512d67d9f35SJunchao Zhang Input Parameter: 4513d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4514d67d9f35SJunchao Zhang 4515d67d9f35SJunchao Zhang Output Parameter: 4516d67d9f35SJunchao Zhang . 
array - pointer to the data 4517d67d9f35SJunchao Zhang 4518d67d9f35SJunchao Zhang Level: intermediate 4519d67d9f35SJunchao Zhang 4520db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4521d67d9f35SJunchao Zhang @*/ 4522d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4523d71ae5a4SJacob Faibussowitsch { 4524d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4525d67d9f35SJunchao Zhang 4526d67d9f35SJunchao Zhang PetscFunctionBegin; 4527d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45289566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4529d67d9f35SJunchao Zhang } else { 4530d67d9f35SJunchao Zhang *array = NULL; 4531d67d9f35SJunchao Zhang } 45328f1ea47aSStefano Zampini PetscFunctionReturn(0); 45338f1ea47aSStefano Zampini } 45348f1ea47aSStefano Zampini 45358f1ea47aSStefano Zampini /*@C 453611a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45377ee59b9bSJunchao Zhang 45387ee59b9bSJunchao Zhang Not Collective 45397ee59b9bSJunchao Zhang 45407ee59b9bSJunchao Zhang Input Parameter: 454111a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45427ee59b9bSJunchao Zhang 45437ee59b9bSJunchao Zhang Output Parameters: 45447ee59b9bSJunchao Zhang + i - row map array of the matrix 45457ee59b9bSJunchao Zhang . j - column index array of the matrix 45467ee59b9bSJunchao Zhang . a - data array of the matrix 45477ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45487ee59b9bSJunchao Zhang 45497ee59b9bSJunchao Zhang Notes: 45507ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45517ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45527ee59b9bSJunchao Zhang 45537ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45547ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45557ee59b9bSJunchao Zhang 45567ee59b9bSJunchao Zhang Level: Developer 45577ee59b9bSJunchao Zhang 4558db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45597ee59b9bSJunchao Zhang @*/ 4560d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4561d71ae5a4SJacob Faibussowitsch { 45627ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45637ee59b9bSJunchao Zhang 45647ee59b9bSJunchao Zhang PetscFunctionBegin; 45657ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45667ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45677ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45687ee59b9bSJunchao Zhang } else { 45697ee59b9bSJunchao Zhang if (i) *i = aij->i; 45707ee59b9bSJunchao Zhang if (j) *j = aij->j; 45717ee59b9bSJunchao Zhang if (a) *a = aij->a; 45727ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45737ee59b9bSJunchao Zhang } 45747ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45757ee59b9bSJunchao Zhang } 45767ee59b9bSJunchao Zhang 45777ee59b9bSJunchao Zhang /*@C 457821e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 457921e72a00SBarry Smith 458021e72a00SBarry Smith Not Collective 458121e72a00SBarry Smith 458221e72a00SBarry Smith Input Parameter: 458311a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 458421e72a00SBarry Smith 458521e72a00SBarry Smith Output Parameter: 458621e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 458721e72a00SBarry Smith 458821e72a00SBarry Smith Level: intermediate 458921e72a00SBarry Smith 4590db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 459121e72a00SBarry Smith @*/ 4592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4593d71ae5a4SJacob Faibussowitsch { 459421e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 459521e72a00SBarry Smith 459621e72a00SBarry Smith PetscFunctionBegin; 459721e72a00SBarry Smith *nz = aij->rmax; 459821e72a00SBarry Smith PetscFunctionReturn(0); 459921e72a00SBarry Smith } 460021e72a00SBarry Smith 4601d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4602d71ae5a4SJacob Faibussowitsch { 4603394ed5ebSJunchao Zhang MPI_Comm comm; 4604394ed5ebSJunchao Zhang PetscInt *i, *j; 4605394ed5ebSJunchao Zhang PetscInt M, N, row; 4606394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4607394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4608394ed5ebSJunchao Zhang PetscInt *Aj; 4609394ed5ebSJunchao Zhang PetscScalar *Aa; 4610cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4611cbc6b225SStefano Zampini MatType rtype; 4612394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4613394ed5ebSJunchao Zhang 4614394ed5ebSJunchao Zhang PetscFunctionBegin; 46159566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46169566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46179566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4618e8729f6fSJunchao Zhang i = coo_i; 4619e8729f6fSJunchao Zhang j = coo_j; 46209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4621394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4622394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4623394ed5ebSJunchao Zhang perm[k] = k; 4624394ed5ebSJunchao Zhang } 4625394ed5ebSJunchao Zhang 4626394ed5ebSJunchao Zhang /* Sort by row */ 46279566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46289371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46299371c9d4SSatish Balay if (i[k] >= 0) break; 46309371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4631394ed5ebSJunchao Zhang nneg = k; 46329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4633394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4634394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4635394ed5ebSJunchao Zhang 46369566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4638394ed5ebSJunchao Zhang 4639394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4640394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4641394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4642394ed5ebSJunchao Zhang while (k < coo_n) { 4643394ed5ebSJunchao Zhang row = i[k]; 4644394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4645394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4646394ed5ebSJunchao Zhang end = k; 46479566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4648394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4649394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4650394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4651394ed5ebSJunchao Zhang Ai[row] = 1; 4652394ed5ebSJunchao Zhang nnz++; 4653394ed5ebSJunchao Zhang 4654394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4655394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4656394ed5ebSJunchao Zhang q++; 4657394ed5ebSJunchao Zhang jmap[q] = 1; 4658394ed5ebSJunchao Zhang Aj[q] = j[p]; 4659394ed5ebSJunchao Zhang Ai[row]++; 4660394ed5ebSJunchao Zhang nnz++; 4661394ed5ebSJunchao Zhang } else { 4662394ed5ebSJunchao Zhang jmap[q]++; 4663394ed5ebSJunchao Zhang } 4664394ed5ebSJunchao Zhang } 4665394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4666394ed5ebSJunchao Zhang } 4667394ed5ebSJunchao Zhang 4668394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4669394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4670394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4671394ed5ebSJunchao Zhang jmap[0] = 0; 4672394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4673394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4674394ed5ebSJunchao Zhang PetscCount *jmap_new; 4675394ed5ebSJunchao Zhang PetscInt *Aj_new; 4676394ed5ebSJunchao Zhang 46779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46789566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46799566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4680394ed5ebSJunchao Zhang jmap = jmap_new; 4681394ed5ebSJunchao Zhang 46829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46839566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 46849566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4685394ed5ebSJunchao Zhang Aj = Aj_new; 4686394ed5ebSJunchao Zhang } 4687394ed5ebSJunchao Zhang 
4688394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4689394ed5ebSJunchao Zhang PetscCount *perm_new; 4690cbc6b225SStefano Zampini 46919566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 46929566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 46939566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4694394ed5ebSJunchao Zhang perm = perm_new; 4695394ed5ebSJunchao Zhang } 4696394ed5ebSJunchao Zhang 46979566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 46989566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 46999566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4700394ed5ebSJunchao Zhang 4701394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4702394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4703394ed5ebSJunchao Zhang /* Record COO fields */ 4704394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4705394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4706394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4707394ed5ebSJunchao Zhang seqaij->perm = perm; 4708394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4709394ed5ebSJunchao Zhang } 4710394ed5ebSJunchao Zhang 4711d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4712d71ae5a4SJacob Faibussowitsch { 4713394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4714394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4715394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4716394ed5ebSJunchao Zhang PetscScalar *Aa; 
4717394ed5ebSJunchao Zhang 4718394ed5ebSJunchao Zhang PetscFunctionBegin; 47199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4720394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4721b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4722b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4723b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4724394ed5ebSJunchao Zhang } 47259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4726394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4727394ed5ebSJunchao Zhang } 4728394ed5ebSJunchao Zhang 472934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47305063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 473102fe1965SBarry Smith #endif 47323d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47335063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47343d0639e7SStefano Zampini #endif 473502fe1965SBarry Smith 4736d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4737d71ae5a4SJacob Faibussowitsch { 4738273d9f13SBarry Smith Mat_SeqAIJ *b; 473938baddfdSBarry Smith PetscMPIInt size; 4740273d9f13SBarry Smith 4741273d9f13SBarry Smith PetscFunctionBegin; 47429566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 474308401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4744273d9f13SBarry Smith 47454dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47462205254eSKarl Rupp 4747b0a32e0cSBarry Smith B->data = (void *)b; 47482205254eSKarl Rupp 47499566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4750071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47512205254eSKarl Rupp 
4752f4259b30SLisandro Dalcin b->row = NULL; 4753f4259b30SLisandro Dalcin b->col = NULL; 4754f4259b30SLisandro Dalcin b->icol = NULL; 4755b810aeb4SBarry Smith b->reallocs = 0; 475636db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4757f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4758416022c9SBarry Smith b->nonew = 0; 4759f4259b30SLisandro Dalcin b->diag = NULL; 4760f4259b30SLisandro Dalcin b->solve_work = NULL; 4761f4259b30SLisandro Dalcin B->spptr = NULL; 4762f4259b30SLisandro Dalcin b->saved_values = NULL; 4763f4259b30SLisandro Dalcin b->idiag = NULL; 4764f4259b30SLisandro Dalcin b->mdiag = NULL; 4765f4259b30SLisandro Dalcin b->ssor_work = NULL; 476671f1c65dSBarry Smith b->omega = 1.0; 476771f1c65dSBarry Smith b->fshift = 0.0; 476871f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4769bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4770a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 477117ab2063SBarry Smith 47729566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4773d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 47749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 47759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4776b3866ffcSBarry Smith #endif 47779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 47789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 47799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 47809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 
47819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 47829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 47839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 47849779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 47859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4786191b95cbSRichard Tran Mills #endif 478734b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 47899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 479102fe1965SBarry Smith #endif 47923d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 47943d0639e7SStefano Zampini #endif 47959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4796af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 47979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4798af8000cdSHong Zhang #endif 4799d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 48009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4801d24d4204SJose E. Roman #endif 480263c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 480563c07aadSStefano Zampini #endif 48069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 48109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 48119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 48139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48159566063dSJacob 
Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48219566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48229566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 48239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48243a40ed3dSBarry Smith PetscFunctionReturn(0); 482517ab2063SBarry Smith } 482617ab2063SBarry Smith 4827b24902e0SBarry Smith /* 48283893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4829b24902e0SBarry Smith */ 4830d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4831d71ae5a4SJacob Faibussowitsch { 48322a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4833071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 483417ab2063SBarry Smith 48353a40ed3dSBarry Smith PetscFunctionBegin; 4836aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4837273d9f13SBarry Smith 4838d5f3da31SBarry Smith C->factortype = A->factortype; 4839f4259b30SLisandro Dalcin c->row = NULL; 4840f4259b30SLisandro Dalcin c->col = NULL; 4841f4259b30SLisandro Dalcin c->icol = NULL; 48426ad4291fSHong Zhang c->reallocs = 0; 484317ab2063SBarry Smith 484469272f91SPierre Jolivet C->assembled = A->assembled; 484569272f91SPierre Jolivet C->preallocated = A->preallocated; 484617ab2063SBarry Smith 484769272f91SPierre Jolivet if (A->preallocated) { 48489566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48499566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4850eec197d1SBarry Smith 48519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48529566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48549566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 485517ab2063SBarry Smith 485617ab2063SBarry Smith /* allocate the matrix space */ 4857f77e22a1SHong Zhang if (mallocmatspace) { 48589566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48592205254eSKarl Rupp 4860f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48612205254eSKarl Rupp 48629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 486317ab2063SBarry Smith if (m > 0) { 48649566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4865be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48662e5835c6SStefano Zampini const PetscScalar *aa; 48672e5835c6SStefano Zampini 48689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48699566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
4871be6bf707SBarry Smith } else { 48729566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 487317ab2063SBarry Smith } 487408480c60SBarry Smith } 4875f77e22a1SHong Zhang } 487617ab2063SBarry Smith 48776ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4878416022c9SBarry Smith c->roworiented = a->roworiented; 4879416022c9SBarry Smith c->nonew = a->nonew; 4880416022c9SBarry Smith if (a->diag) { 48819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 48829566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4883071fcb05SBarry Smith } else c->diag = NULL; 48842205254eSKarl Rupp 4885f4259b30SLisandro Dalcin c->solve_work = NULL; 4886f4259b30SLisandro Dalcin c->saved_values = NULL; 4887f4259b30SLisandro Dalcin c->idiag = NULL; 4888f4259b30SLisandro Dalcin c->ssor_work = NULL; 4889a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4890e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4891e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 48926ad4291fSHong Zhang 4893893ad86cSHong Zhang c->rmax = a->rmax; 4894416022c9SBarry Smith c->nz = a->nz; 48958ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4896754ec7b1SSatish Balay 48976ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 48986ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4899cd6b891eSBarry Smith if (a->compressedrow.use) { 49006ad4291fSHong Zhang i = a->compressedrow.nrows; 49019566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49029566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49039566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 490427ea64f8SHong Zhang } else { 490527ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49060298fd71SBarry Smith c->compressedrow.i = 
NULL; 49070298fd71SBarry Smith c->compressedrow.rindex = NULL; 49086ad4291fSHong Zhang } 4909ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4910e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49114846f1f5SKris Buschelman 49129566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 491369272f91SPierre Jolivet } 49149566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49153a40ed3dSBarry Smith PetscFunctionReturn(0); 491617ab2063SBarry Smith } 491717ab2063SBarry Smith 4918d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4919d71ae5a4SJacob Faibussowitsch { 4920b24902e0SBarry Smith PetscFunctionBegin; 49219566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49229566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 492348a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49249566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49259566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4926b24902e0SBarry Smith PetscFunctionReturn(0); 4927b24902e0SBarry Smith } 4928b24902e0SBarry Smith 4929d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4930d71ae5a4SJacob Faibussowitsch { 493152f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 493252f91c60SVaclav Hapla 493352f91c60SVaclav Hapla PetscFunctionBegin; 493452f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 493552f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4936c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49379566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 
49389566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49399566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 494052f91c60SVaclav Hapla if (isbinary) { 49419566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 494252f91c60SVaclav Hapla } else if (ishdf5) { 494352f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49449566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 494552f91c60SVaclav Hapla #else 494652f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 494752f91c60SVaclav Hapla #endif 494852f91c60SVaclav Hapla } else { 494998921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 495052f91c60SVaclav Hapla } 495152f91c60SVaclav Hapla PetscFunctionReturn(0); 495252f91c60SVaclav Hapla } 495352f91c60SVaclav Hapla 4954d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4955d71ae5a4SJacob Faibussowitsch { 49563ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49573ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4958fbdbba38SShri Abhyankar 4959fbdbba38SShri Abhyankar PetscFunctionBegin; 49609566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4961bbead8a2SBarry Smith 49623ea6fe3dSLisandro Dalcin /* read in matrix header */ 49639566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 496408401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49659371c9d4SSatish Balay M = header[1]; 
49669371c9d4SSatish Balay N = header[2]; 49679371c9d4SSatish Balay nz = header[3]; 496808401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 496908401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 497008401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4971fbdbba38SShri Abhyankar 49723ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49739566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49743ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49753ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49763ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49773ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49783ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49799566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49809566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49813ea6fe3dSLisandro Dalcin 49823ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49839566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4984aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49853ea6fe3dSLisandro Dalcin 4986fbdbba38SShri Abhyankar /* read in row lengths */ 49879566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 49889566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 
49893ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 49909371c9d4SSatish Balay sum = 0; 49919371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 499208401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 49933ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 49949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 49959566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4996aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49973ea6fe3dSLisandro Dalcin /* store row lengths */ 49989566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 49999566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5000fbdbba38SShri Abhyankar 50013ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50029371c9d4SSatish Balay a->i[0] = 0; 50039371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50043ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50059566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50063ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50079566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5008fbdbba38SShri Abhyankar 50099566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50109566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 5011fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5012fbdbba38SShri Abhyankar } 5013fbdbba38SShri Abhyankar 5014d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5015d71ae5a4SJacob Faibussowitsch { 50167264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5017fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5018eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5019eeffb40dSHong Zhang PetscInt k; 5020eeffb40dSHong Zhang #endif 50217264ac53SSatish Balay 50223a40ed3dSBarry Smith PetscFunctionBegin; 5023bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5024d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5025ca44d042SBarry Smith *flg = PETSC_FALSE; 5026ca44d042SBarry Smith PetscFunctionReturn(0); 5027bcd2baecSBarry Smith } 50287264ac53SSatish Balay 50297264ac53SSatish Balay /* if the a->i are the same */ 50309566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5031abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50327264ac53SSatish Balay 50337264ac53SSatish Balay /* if a->j are the same */ 50349566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5035abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5036bcd2baecSBarry Smith 50379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5039bcd2baecSBarry Smith /* if a->a are the same */ 5040eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5041eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5042fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5043eeffb40dSHong Zhang *flg = PETSC_FALSE; 50443a40ed3dSBarry Smith PetscFunctionReturn(0); 5045eeffb40dSHong Zhang } 5046eeffb40dSHong Zhang } 5047eeffb40dSHong Zhang #else 50489566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5049eeffb40dSHong Zhang #endif 50509566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5052eeffb40dSHong Zhang PetscFunctionReturn(0); 50537264ac53SSatish Balay } 505436db0b34SBarry Smith 505505869f15SSatish Balay /*@ 505611a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 505736db0b34SBarry Smith provided by the user. 505836db0b34SBarry Smith 5059d083f849SBarry Smith Collective 506036db0b34SBarry Smith 506136db0b34SBarry Smith Input Parameters: 506236db0b34SBarry Smith + comm - must be an MPI communicator of size 1 506336db0b34SBarry Smith . m - number of rows 506436db0b34SBarry Smith . n - number of columns 5065483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 506636db0b34SBarry Smith . j - column indices 506736db0b34SBarry Smith - a - matrix values 506836db0b34SBarry Smith 506936db0b34SBarry Smith Output Parameter: 507036db0b34SBarry Smith . mat - the matrix 507136db0b34SBarry Smith 507236db0b34SBarry Smith Level: intermediate 507336db0b34SBarry Smith 507436db0b34SBarry Smith Notes: 50750551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5076292fb18eSBarry Smith once the matrix is destroyed and not before 507736db0b34SBarry Smith 507836db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 507936db0b34SBarry Smith 5080bfeeae90SHong Zhang The i and j indices are 0 based 508136db0b34SBarry Smith 5082a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5083a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50848eef79e4SBarry Smith as shown 5085a4552177SSatish Balay 50868eef79e4SBarry Smith $ 1 0 0 50878eef79e4SBarry Smith $ 2 0 3 50888eef79e4SBarry Smith $ 4 5 6 50898eef79e4SBarry Smith $ 50908eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 50918eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 50928eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5093a4552177SSatish Balay 5094db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 509536db0b34SBarry Smith @*/ 5096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5097d71ae5a4SJacob Faibussowitsch { 5098cbcfb4deSHong Zhang PetscInt ii; 509936db0b34SBarry Smith Mat_SeqAIJ *aij; 5100cbcfb4deSHong Zhang PetscInt jj; 510136db0b34SBarry Smith 510236db0b34SBarry Smith PetscFunctionBegin; 5103aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51049566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51059566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51069566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51079566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5109ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5112ab93d7beSBarry Smith 511336db0b34SBarry Smith aij->i = i; 511436db0b34SBarry Smith aij->j = j; 511536db0b34SBarry Smith aij->a = a; 511636db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
511736db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5118e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5119e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 512036db0b34SBarry Smith 5121cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 512236db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 512376bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5124aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51259985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 512608401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 512708401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51289985e31cSBarry Smith } 512936db0b34SBarry Smith } 513076bd3646SJed Brown } 513176bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 513236db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 513308401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5134aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 513536db0b34SBarry Smith } 513676bd3646SJed Brown } 513736db0b34SBarry Smith 51389566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51399566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 514036db0b34SBarry Smith PetscFunctionReturn(0); 514136db0b34SBarry Smith } 5142cbc6b225SStefano Zampini 5143f62e3866SBarry Smith /*@ 514411a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51458a0b0e6bSVictor Minden provided by the user. 51468a0b0e6bSVictor Minden 5147d083f849SBarry Smith Collective 51488a0b0e6bSVictor Minden 51498a0b0e6bSVictor Minden Input Parameters: 51508a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51518a0b0e6bSVictor Minden . m - number of rows 51528a0b0e6bSVictor Minden . n - number of columns 51538a0b0e6bSVictor Minden . i - row indices 51548a0b0e6bSVictor Minden . j - column indices 51551230e6d1SVictor Minden . a - matrix values 51561230e6d1SVictor Minden . nz - number of nonzeros 515711a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51588a0b0e6bSVictor Minden 51598a0b0e6bSVictor Minden Output Parameter: 51608a0b0e6bSVictor Minden . 
mat - the matrix 51618a0b0e6bSVictor Minden 51628a0b0e6bSVictor Minden Level: intermediate 51638a0b0e6bSVictor Minden 5164f62e3866SBarry Smith Example: 5165f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51669e99939fSJunchao Zhang .vb 51678a0b0e6bSVictor Minden 1 0 0 51688a0b0e6bSVictor Minden 2 0 3 51698a0b0e6bSVictor Minden 4 5 6 51708a0b0e6bSVictor Minden 51718a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51728a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51738a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51749e99939fSJunchao Zhang .ve 5175d7547e51SJunchao Zhang Notes: 5176d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5177d7547e51SJunchao Zhang and are particularly useful in iterative applications. 51788a0b0e6bSVictor Minden 5179d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 51808a0b0e6bSVictor Minden @*/ 5181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5182d71ae5a4SJacob Faibussowitsch { 5183d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 51848a0b0e6bSVictor Minden 51858a0b0e6bSVictor Minden PetscFunctionBegin; 51869566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5187ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 51889566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51899566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51909566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 51921230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 51931230e6d1SVictor Minden if (idx) { 51941230e6d1SVictor Minden row = i[ii] - 1; 51951230e6d1SVictor Minden col = j[ii] - 1; 51961230e6d1SVictor Minden } else { 51971230e6d1SVictor Minden row = i[ii]; 51981230e6d1SVictor Minden col = j[ii]; 51998a0b0e6bSVictor Minden } 52009566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52018a0b0e6bSVictor Minden } 52029566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52039566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52049566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52058a0b0e6bSVictor Minden PetscFunctionReturn(0); 52068a0b0e6bSVictor Minden } 520736db0b34SBarry Smith 5208d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5209d71ae5a4SJacob Faibussowitsch { 5210acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5211acf2f550SJed Brown 5212acf2f550SJed Brown PetscFunctionBegin; 5213acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5214acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52152205254eSKarl Rupp 52169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5217acf2f550SJed Brown PetscFunctionReturn(0); 5218acf2f550SJed Brown } 5219acf2f550SJed Brown 5220d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5221d71ae5a4SJacob Faibussowitsch { 52229c8f2541SHong Zhang PetscFunctionBegin; 52239566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52249c8f2541SHong Zhang PetscFunctionReturn(0); 52259c8f2541SHong Zhang } 52269c8f2541SHong Zhang 522781824310SBarry Smith /* 522853dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
522953dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 523053dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 523153dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 523253dd7562SDmitry Karpeev */ 5233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5234d71ae5a4SJacob Faibussowitsch { 523553dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 523653dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 523753dd7562SDmitry Karpeev PetscBool seqaij; 523853dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 523953dd7562SDmitry Karpeev PetscScalar v; 524053dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 524153dd7562SDmitry Karpeev 524253dd7562SDmitry Karpeev PetscFunctionBegin; 524353dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 524453dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52459566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 524628b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 524753dd7562SDmitry Karpeev if (rowemb) { 52489566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 524908401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 525053dd7562SDmitry Karpeev } else { 525108401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 525253dd7562SDmitry Karpeev } 525353dd7562SDmitry Karpeev if (colemb) { 52549566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 525508401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 525653dd7562SDmitry Karpeev } else { 525708401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 525853dd7562SDmitry Karpeev } 525953dd7562SDmitry Karpeev 526053dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 526153dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5263ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52659566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 526653dd7562SDmitry Karpeev } 526748a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 526853dd7562SDmitry Karpeev count = 0; 526953dd7562SDmitry Karpeev rowindices = NULL; 
527053dd7562SDmitry Karpeev colindices = NULL; 527148a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 527248a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 527353dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 527453dd7562SDmitry Karpeev PetscInt row; 527553dd7562SDmitry Karpeev row = i; 527653dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 527753dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 527853dd7562SDmitry Karpeev PetscInt col; 527953dd7562SDmitry Karpeev col = Baij->j[count]; 528053dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 528153dd7562SDmitry Karpeev v = Baij->a[count]; 52829566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 528353dd7562SDmitry Karpeev ++count; 528453dd7562SDmitry Karpeev } 528553dd7562SDmitry Karpeev } 528653dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 528753dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 528853dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 528953dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 529053dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 529153dd7562SDmitry Karpeev PetscFunctionReturn(0); 529253dd7562SDmitry Karpeev } 529353dd7562SDmitry Karpeev 52944099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 52954099cc6bSBarry Smith 52964099cc6bSBarry Smith /*@C 529711a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 52984099cc6bSBarry Smith 5299c3339decSBarry Smith Collective 53004099cc6bSBarry Smith 53014099cc6bSBarry Smith Input Parameters: 53024099cc6bSBarry Smith + mat - the matrix object 53034099cc6bSBarry Smith - matype - matrix type 53044099cc6bSBarry Smith 53054099cc6bSBarry Smith Options Database Key: 53064099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 53074099cc6bSBarry Smith 53084099cc6bSBarry Smith Level: intermediate 53094099cc6bSBarry Smith 5310db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53114099cc6bSBarry Smith @*/ 5312d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5313d71ae5a4SJacob Faibussowitsch { 53144099cc6bSBarry Smith PetscBool sametype; 53155f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53164099cc6bSBarry Smith 53174099cc6bSBarry Smith PetscFunctionBegin; 53184099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53199566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53204099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53214099cc6bSBarry Smith 53229566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53235f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53249566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53254099cc6bSBarry Smith PetscFunctionReturn(0); 53264099cc6bSBarry Smith } 53274099cc6bSBarry Smith 53284099cc6bSBarry Smith /*@C 532911a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53304099cc6bSBarry Smith 53314099cc6bSBarry Smith Not Collective 53324099cc6bSBarry Smith 53334099cc6bSBarry Smith Input Parameters: 533411a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 53354099cc6bSBarry Smith - function - routine to convert to subtype 53364099cc6bSBarry Smith 53374099cc6bSBarry Smith Notes: 533811a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
53394099cc6bSBarry Smith 53404099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53414099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53424099cc6bSBarry Smith 53434099cc6bSBarry Smith Level: advanced 53444099cc6bSBarry Smith 5345db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53464099cc6bSBarry Smith @*/ 5347d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5348d71ae5a4SJacob Faibussowitsch { 53494099cc6bSBarry Smith PetscFunctionBegin; 53509566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53519566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 53524099cc6bSBarry Smith PetscFunctionReturn(0); 53534099cc6bSBarry Smith } 53544099cc6bSBarry Smith 53554099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53564099cc6bSBarry Smith 53574099cc6bSBarry Smith /*@C 535811a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 53594099cc6bSBarry Smith 53604099cc6bSBarry Smith Not Collective 53614099cc6bSBarry Smith 53624099cc6bSBarry Smith Level: advanced 53634099cc6bSBarry Smith 5364db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53654099cc6bSBarry Smith @*/ 5366d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5367d71ae5a4SJacob Faibussowitsch { 53684099cc6bSBarry Smith PetscFunctionBegin; 53694099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53704099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53714099cc6bSBarry Smith 53729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 53759779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 53769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5377485f9817SRichard Tran Mills #endif 53785063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 53799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 53805063d097SStefano Zampini #endif 53815063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 53829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 53835063d097SStefano Zampini #endif 53844099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 53859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 53864099cc6bSBarry Smith #endif 53874099cc6bSBarry Smith PetscFunctionReturn(0); 53884099cc6bSBarry Smith } 538953dd7562SDmitry Karpeev 539053dd7562SDmitry Karpeev /* 539181824310SBarry Smith Special version for direct calls from Fortran 539281824310SBarry Smith */ 5393af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 539481824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 539581824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 539681824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 539781824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 539881824310SBarry Smith #endif 539981824310SBarry Smith 540081824310SBarry Smith /* Change these macros so can be used in void function */ 540198921bdaSJacob Faibussowitsch 540298921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54039566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54049566063dSJacob Faibussowitsch #undef PetscCall 54059371c9d4SSatish Balay #define PetscCall(...) 
\ 54069371c9d4SSatish Balay do { \ 54075f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 540898921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 540998921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 541098921bdaSJacob Faibussowitsch return; \ 541198921bdaSJacob Faibussowitsch } \ 541298921bdaSJacob Faibussowitsch } while (0) 541398921bdaSJacob Faibussowitsch 541498921bdaSJacob Faibussowitsch #undef SETERRQ 54159371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54169371c9d4SSatish Balay do { \ 541798921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 541898921bdaSJacob Faibussowitsch return; \ 541998921bdaSJacob Faibussowitsch } while (0) 542081824310SBarry Smith 5421d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5422d71ae5a4SJacob Faibussowitsch { 542381824310SBarry Smith Mat A = *AA; 542481824310SBarry Smith PetscInt m = *mm, n = *nn; 542581824310SBarry Smith InsertMode is = *isis; 542681824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 542781824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 542881824310SBarry Smith PetscInt *imax, *ai, *ailen; 542981824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 543054f21887SBarry Smith MatScalar *ap, value, *aa; 5431ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5432ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 543381824310SBarry Smith 543481824310SBarry Smith PetscFunctionBegin; 54354994cf47SJed Brown MatCheckPreallocated(A, 1); 543681824310SBarry Smith imax = a->imax; 543781824310SBarry Smith ai = a->i; 543881824310SBarry Smith 
ailen = a->ilen; 543981824310SBarry Smith aj = a->j; 544081824310SBarry Smith aa = a->a; 544181824310SBarry Smith 544281824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 544381824310SBarry Smith row = im[k]; 544481824310SBarry Smith if (row < 0) continue; 54455f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 54469371c9d4SSatish Balay rp = aj + ai[row]; 54479371c9d4SSatish Balay ap = aa + ai[row]; 54489371c9d4SSatish Balay rmax = imax[row]; 54499371c9d4SSatish Balay nrow = ailen[row]; 545081824310SBarry Smith low = 0; 545181824310SBarry Smith high = nrow; 545281824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 545381824310SBarry Smith if (in[l] < 0) continue; 54545f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 545581824310SBarry Smith col = in[l]; 54562205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 54572205254eSKarl Rupp else value = v[k + l * m]; 54582205254eSKarl Rupp 545981824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 546081824310SBarry Smith 54612205254eSKarl Rupp if (col <= lastcol) low = 0; 54622205254eSKarl Rupp else high = nrow; 546381824310SBarry Smith lastcol = col; 546481824310SBarry Smith while (high - low > 5) { 546581824310SBarry Smith t = (low + high) / 2; 546681824310SBarry Smith if (rp[t] > col) high = t; 546781824310SBarry Smith else low = t; 546881824310SBarry Smith } 546981824310SBarry Smith for (i = low; i < high; i++) { 547081824310SBarry Smith if (rp[i] > col) break; 547181824310SBarry Smith if (rp[i] == col) { 547281824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 547381824310SBarry Smith else ap[i] = value; 547481824310SBarry Smith goto noinsert; 547581824310SBarry Smith } 547681824310SBarry Smith } 547781824310SBarry Smith if (value == 0.0 && 
ignorezeroentries) goto noinsert; 547881824310SBarry Smith if (nonew == 1) goto noinsert; 54795f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5480fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 54819371c9d4SSatish Balay N = nrow++ - 1; 54829371c9d4SSatish Balay a->nz++; 54839371c9d4SSatish Balay high++; 548481824310SBarry Smith /* shift up all the later entries in this row */ 548581824310SBarry Smith for (ii = N; ii >= i; ii--) { 548681824310SBarry Smith rp[ii + 1] = rp[ii]; 548781824310SBarry Smith ap[ii + 1] = ap[ii]; 548881824310SBarry Smith } 548981824310SBarry Smith rp[i] = col; 549081824310SBarry Smith ap[i] = value; 5491e56f5c9eSBarry Smith A->nonzerostate++; 549281824310SBarry Smith noinsert:; 549381824310SBarry Smith low = i + 1; 549481824310SBarry Smith } 549581824310SBarry Smith ailen[row] = nrow; 549681824310SBarry Smith } 549781824310SBarry Smith PetscFunctionReturnVoid(); 549881824310SBarry Smith } 549998921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 550098921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 550198921bdaSJacob Faibussowitsch * original definitions */ 55029566063dSJacob Faibussowitsch #undef PetscCall 550398921bdaSJacob Faibussowitsch #undef SETERRQ 5504