1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 597*4e208921SJed Brown const MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 600*4e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 636*4e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, 
m, PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 11237b083b7cSBarry Smith 112417ab2063SBarry Smith /* reset ilen and imax for each row */ 11257b083b7cSBarry Smith a->nonzerorowcnt = 0; 1126396832f4SHong Zhang if (A->structure_only) { 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1129396832f4SHong Zhang } else { /* !A->structure_only */ 113017ab2063SBarry Smith for (i = 0; i < m; i++) { 113117ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11327b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113317ab2063SBarry Smith } 1134396832f4SHong Zhang } 1135bfeeae90SHong Zhang a->nz = ai[m]; 1136aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, 
PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113717ab2063SBarry Smith 11389566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11419566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11422205254eSKarl Rupp 11438e58a170SBarry Smith A->info.mallocs += a->reallocs; 1144dd5f02e7SSatish Balay a->reallocs = 0; 11456712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114636db0b34SBarry Smith a->rmax = rmax; 11474e220ebcSLois Curfman McInnes 114848a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11503a40ed3dSBarry Smith PetscFunctionReturn(0); 115117ab2063SBarry Smith } 115217ab2063SBarry Smith 1153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1154d71ae5a4SJacob Faibussowitsch { 115599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115699cafbc1SBarry Smith PetscInt i, nz = a->nz; 11572e5835c6SStefano Zampini MatScalar *aa; 115899cafbc1SBarry Smith 115999cafbc1SBarry Smith PetscFunctionBegin; 11609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116199cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116499cafbc1SBarry Smith PetscFunctionReturn(0); 
116599cafbc1SBarry Smith } 116699cafbc1SBarry Smith 1167d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1168d71ae5a4SJacob Faibussowitsch { 116999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117099cafbc1SBarry Smith PetscInt i, nz = a->nz; 11712e5835c6SStefano Zampini MatScalar *aa; 117299cafbc1SBarry Smith 117399cafbc1SBarry Smith PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117899cafbc1SBarry Smith PetscFunctionReturn(0); 117999cafbc1SBarry Smith } 118099cafbc1SBarry Smith 1181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1182d71ae5a4SJacob Faibussowitsch { 1183fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1184fff043a9SJunchao Zhang MatScalar *aa; 11853a40ed3dSBarry Smith 11863a40ed3dSBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11889566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913a40ed3dSBarry Smith PetscFunctionReturn(0); 119217ab2063SBarry Smith } 1193416022c9SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197cbc6b225SStefano Zampini 1198cbc6b225SStefano Zampini PetscFunctionBegin; 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1201cbc6b225SStefano Zampini PetscFunctionReturn(0); 
1202cbc6b225SStefano Zampini } 1203cbc6b225SStefano Zampini 1204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1205d71ae5a4SJacob Faibussowitsch { 1206416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1207d5d45c9bSBarry Smith 12083a40ed3dSBarry Smith PetscFunctionBegin; 1209aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1210c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121117ab2063SBarry Smith #endif 12129566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12139566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12159566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12269566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1228901853e0SKris Buschelman 12296718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12306718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12316718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12326718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12336718818eSStefano Zampini due to different matrix sizes */ 12349566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12356718818eSStefano Zampini 12369566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12382e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12472e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12482e956fe4SStefano Zampini #endif 12494222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12534222ddf1SHong Zhang #endif 12543d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12563d0639e7SStefano Zampini #endif 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1258af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1260af8000cdSHong Zhang #endif 1261d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1263d24d4204SJose E. 
Roman #endif 126463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 126763c07aadSStefano Zampini #endif 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12722e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12832e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12842e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12892e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12903a40ed3dSBarry Smith PetscFunctionReturn(0); 129117ab2063SBarry Smith } 129217ab2063SBarry Smith 1293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1294d71ae5a4SJacob Faibussowitsch { 1295416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 12963a40ed3dSBarry Smith 12973a40ed3dSBarry Smith PetscFunctionBegin; 1298a65d3064SKris Buschelman switch (op) { 1299d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1300d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1301d71ae5a4SJacob Faibussowitsch break; 1302d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1303d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1304d71ae5a4SJacob Faibussowitsch break; 1305d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1306d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1307d71ae5a4SJacob Faibussowitsch break; 1308d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1309d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1310d71ae5a4SJacob Faibussowitsch break; 1311d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1312d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1315d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1318d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1319d71ae5a4SJacob Faibussowitsch break; 13203d472b54SHong Zhang case MAT_SPD: 1321b1646e73SJed Brown case MAT_SYMMETRIC: 1322b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1323b1646e73SJed Brown case MAT_HERMITIAN: 1324b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1325957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1326b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1327b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1328b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13295021d80fSJed Brown break; 13308c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1331a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1332d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1333d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1334d71ae5a4SJacob Faibussowitsch break; 1335d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1336d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1337d71ae5a4SJacob Faibussowitsch break; 1338d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1339d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1340d71ae5a4SJacob Faibussowitsch break; 1341071fcb05SBarry Smith case MAT_SORTED_FULL: 
1342071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1343071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1344071fcb05SBarry Smith break; 1345d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1346d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1347d71ae5a4SJacob Faibussowitsch break; 1348d71ae5a4SJacob Faibussowitsch default: 1349d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1350a65d3064SKris Buschelman } 13513a40ed3dSBarry Smith PetscFunctionReturn(0); 135217ab2063SBarry Smith } 135317ab2063SBarry Smith 1354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1355d71ae5a4SJacob Faibussowitsch { 1356416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1357fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1358c898d852SStefano Zampini PetscScalar *x; 1359c898d852SStefano Zampini const PetscScalar *aa; 136017ab2063SBarry Smith 13613a40ed3dSBarry Smith PetscFunctionBegin; 13629566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1365d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1366d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13679566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13682c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137135e7444dSHong Zhang PetscFunctionReturn(0); 137235e7444dSHong Zhang } 137335e7444dSHong Zhang 13749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137535e7444dSHong Zhang for (i = 0; i < n; i++) { 
1376fdc842d1SBarry Smith x[i] = 0.0; 137735e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 137835e7444dSHong Zhang if (aj[j] == i) { 137935e7444dSHong Zhang x[i] = aa[j]; 138017ab2063SBarry Smith break; 138117ab2063SBarry Smith } 138217ab2063SBarry Smith } 138317ab2063SBarry Smith } 13849566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13863a40ed3dSBarry Smith PetscFunctionReturn(0); 138717ab2063SBarry Smith } 138817ab2063SBarry Smith 1389c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1390d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1391d71ae5a4SJacob Faibussowitsch { 1392416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13935f22a7b3SSebastian Grimberg const MatScalar *aa; 1394d9ca1df4SBarry Smith PetscScalar *y; 1395d9ca1df4SBarry Smith const PetscScalar *x; 1396d0f46423SBarry Smith PetscInt m = A->rmap->n; 13975c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 13985f22a7b3SSebastian Grimberg const MatScalar *v; 1399a77337e4SBarry Smith PetscScalar alpha; 1400d9ca1df4SBarry Smith PetscInt n, i, j; 1401d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14023447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1403ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14045c897100SBarry Smith #endif 140517ab2063SBarry Smith 14063a40ed3dSBarry Smith PetscFunctionBegin; 14079566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14099566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14115c897100SBarry Smith 14125c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1413fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14145c897100SBarry Smith #else 14153447b6efSHong Zhang if (usecprow) { 14163447b6efSHong Zhang m = cprow.nrows; 14173447b6efSHong Zhang ii = cprow.i; 14187b2bb3b9SHong Zhang ridx = cprow.rindex; 14193447b6efSHong Zhang } else { 14203447b6efSHong Zhang ii = a->i; 14213447b6efSHong Zhang } 142217ab2063SBarry Smith for (i = 0; i < m; i++) { 14233447b6efSHong Zhang idx = a->j + ii[i]; 1424fff043a9SJunchao Zhang v = aa + ii[i]; 14253447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14263447b6efSHong Zhang if (usecprow) { 14277b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14283447b6efSHong Zhang } else { 142917ab2063SBarry Smith alpha = x[i]; 14303447b6efSHong Zhang } 143104fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143217ab2063SBarry Smith } 14335c897100SBarry Smith #endif 14349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14359566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14369566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14383a40ed3dSBarry Smith PetscFunctionReturn(0); 143917ab2063SBarry Smith } 144017ab2063SBarry Smith 1441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1442d71ae5a4SJacob Faibussowitsch { 14435c897100SBarry Smith PetscFunctionBegin; 14449566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14459566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14465c897100SBarry Smith PetscFunctionReturn(0); 14475c897100SBarry Smith } 14485c897100SBarry Smith 1449c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145078b84d54SShri Abhyankar 1451d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1452d71ae5a4SJacob Faibussowitsch { 1453416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1454d9fead3dSBarry Smith PetscScalar *y; 145554f21887SBarry Smith const 
PetscScalar *x; 1456fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1457003131ecSBarry Smith PetscInt m = A->rmap->n; 14580298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14597b083b7cSBarry Smith PetscInt n, i; 1460362ced78SSatish Balay PetscScalar sum; 1461ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146217ab2063SBarry Smith 1463b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146497952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1465fee21e36SBarry Smith #endif 1466fee21e36SBarry Smith 14673a40ed3dSBarry Smith PetscFunctionBegin; 1468b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14699566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1470b215bc84SStefano Zampini PetscFunctionReturn(0); 1471b215bc84SStefano Zampini } 14729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14739566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14749566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1475416022c9SBarry Smith ii = a->i; 14764eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 147897952fefSHong Zhang m = a->compressedrow.nrows; 147997952fefSHong Zhang ii = a->compressedrow.i; 148097952fefSHong Zhang ridx = a->compressedrow.rindex; 148197952fefSHong Zhang for (i = 0; i < m; i++) { 148297952fefSHong Zhang n = ii[i + 1] - ii[i]; 148397952fefSHong Zhang aj = a->j + ii[i]; 1484fff043a9SJunchao Zhang aa = a_a + ii[i]; 148597952fefSHong Zhang sum = 0.0; 1486003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1487003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 148897952fefSHong Zhang y[*ridx++] = sum; 148997952fefSHong Zhang } 149097952fefSHong Zhang } else { /* do not use compressed row format */ 1491b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14923d3eaba7SBarry Smith aj = a->j; 1493fff043a9SJunchao Zhang aa 
= a_a; 1494b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1495b05257ddSBarry Smith #else 149617ab2063SBarry Smith for (i = 0; i < m; i++) { 1497003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1498003131ecSBarry Smith aj = a->j + ii[i]; 1499fff043a9SJunchao Zhang aa = a_a + ii[i]; 150017ab2063SBarry Smith sum = 0.0; 1501003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150217ab2063SBarry Smith y[i] = sum; 150317ab2063SBarry Smith } 15048d195f9aSBarry Smith #endif 1505b05257ddSBarry Smith } 15069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15089566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15103a40ed3dSBarry Smith PetscFunctionReturn(0); 151117ab2063SBarry Smith } 151217ab2063SBarry Smith 1513d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1514d71ae5a4SJacob Faibussowitsch { 1515b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1516b434eb95SMatthew G. Knepley PetscScalar *y; 1517b434eb95SMatthew G. Knepley const PetscScalar *x; 1518fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1519b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1520b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1521b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1522b434eb95SMatthew G. Knepley PetscScalar sum; 1523b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1524b434eb95SMatthew G. Knepley 1525b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1526b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1527b434eb95SMatthew G. Knepley #endif 1528b434eb95SMatthew G. Knepley 1529b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15319566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15329566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1533b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1534b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1535b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1536b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1537b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1538b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1539b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1540fff043a9SJunchao Zhang aa = a_a + ii[i]; 1541b434eb95SMatthew G. Knepley sum = 0.0; 1542b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1543b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1544b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1545b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1546b434eb95SMatthew G. Knepley } 1547b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15483d3eaba7SBarry Smith ii = a->i; 1549b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1550b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1551b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1552fff043a9SJunchao Zhang aa = a_a + ii[i]; 1553b434eb95SMatthew G. Knepley sum = 0.0; 1554b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1555b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1556b434eb95SMatthew G. Knepley y[i] = sum; 1557b434eb95SMatthew G. Knepley } 1558b434eb95SMatthew G. Knepley } 15599566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15619566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1563b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1564b434eb95SMatthew G. Knepley } 1565b434eb95SMatthew G. Knepley 1566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1567d71ae5a4SJacob Faibussowitsch { 1568b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1569b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1570b434eb95SMatthew G. Knepley const PetscScalar *x; 1571fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1572b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1573b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1574b434eb95SMatthew G. Knepley PetscScalar sum; 1575b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1576b434eb95SMatthew G. Knepley 1577b434eb95SMatthew G. Knepley PetscFunctionBegin; 15789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15809566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1581b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1583b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1584b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1585b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1586b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1587b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1588b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1589fff043a9SJunchao Zhang aa = a_a + ii[i]; 1590b434eb95SMatthew G. Knepley sum = y[*ridx]; 1591b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1592b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1593b434eb95SMatthew G. Knepley } 1594b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15953d3eaba7SBarry Smith ii = a->i; 1596b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1597b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1598b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1599fff043a9SJunchao Zhang aa = a_a + ii[i]; 1600b434eb95SMatthew G. Knepley sum = y[i]; 1601b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1602b434eb95SMatthew G. Knepley z[i] = sum; 1603b434eb95SMatthew G. Knepley } 1604b434eb95SMatthew G. Knepley } 16059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1609b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1610b434eb95SMatthew G. Knepley } 1611b434eb95SMatthew G. Knepley 1612c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1613d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1614d71ae5a4SJacob Faibussowitsch { 1615416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1616f15663dcSBarry Smith PetscScalar *y, *z; 1617f15663dcSBarry Smith const PetscScalar *x; 1618fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1619d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1620d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1621362ced78SSatish Balay PetscScalar sum; 1622ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16239ea0dfa2SSatish Balay 16243a40ed3dSBarry Smith PetscFunctionBegin; 1625b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16269566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1627b215bc84SStefano Zampini PetscFunctionReturn(0); 1628b215bc84SStefano Zampini } 16299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16319566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16324eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163348a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163497952fefSHong Zhang m = a->compressedrow.nrows; 163597952fefSHong Zhang ii = a->compressedrow.i; 163697952fefSHong Zhang ridx = a->compressedrow.rindex; 163797952fefSHong Zhang for (i = 0; i < m; i++) { 163897952fefSHong Zhang n = ii[i + 1] - ii[i]; 163997952fefSHong Zhang aj = a->j + ii[i]; 1640fff043a9SJunchao Zhang aa = a_a + ii[i]; 164197952fefSHong Zhang sum = y[*ridx]; 1642f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164397952fefSHong Zhang z[*ridx++] = sum; 164497952fefSHong Zhang } 164597952fefSHong Zhang } else { /* do not use compressed row format */ 16463d3eaba7SBarry Smith ii = a->i; 1647f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16483d3eaba7SBarry Smith aj = a->j; 1649fff043a9SJunchao Zhang aa = a_a; 1650f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1651f15663dcSBarry Smith #else 165217ab2063SBarry Smith for (i = 0; i < m; i++) { 1653f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1654f15663dcSBarry Smith aj = a->j + ii[i]; 1655fff043a9SJunchao Zhang aa = a_a + ii[i]; 165617ab2063SBarry Smith sum = y[i]; 1657f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165817ab2063SBarry Smith z[i] = sum; 165917ab2063SBarry Smith } 166002ab625aSSatish Balay #endif 1661f15663dcSBarry Smith } 16629566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16663a40ed3dSBarry Smith PetscFunctionReturn(0); 166717ab2063SBarry Smith } 166817ab2063SBarry Smith 166917ab2063SBarry Smith /* 167017ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167117ab2063SBarry Smith */ 1672d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1673d71ae5a4SJacob Faibussowitsch { 1674416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1675d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1676c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 167717ab2063SBarry Smith 16783a40ed3dSBarry Smith PetscFunctionBegin; 167909f38230SBarry Smith if (!a->diag) { 16809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1681c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168209f38230SBarry Smith } 1683d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1684c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1685c0c07093SJunchao Zhang if (alreadySet) { 1686c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1687c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1688c0c07093SJunchao Zhang } 1689c0c07093SJunchao Zhang 169009f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1691bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1692bfeeae90SHong Zhang if (a->j[j] == i) { 169309f38230SBarry Smith a->diag[i] = j; 169417ab2063SBarry Smith break; 169517ab2063SBarry Smith } 169617ab2063SBarry Smith } 169717ab2063SBarry Smith } 16983a40ed3dSBarry Smith PetscFunctionReturn(0); 169917ab2063SBarry Smith } 170017ab2063SBarry Smith 1701d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1702d71ae5a4SJacob Faibussowitsch { 170361ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170461ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170561ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 170661ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 170761ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 170861ecd0c6SBarry Smith 170961ecd0c6SBarry Smith PetscFunctionBegin; 
171061ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17129566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171361ecd0c6SBarry Smith PetscFunctionReturn(0); 171461ecd0c6SBarry Smith } 171561ecd0c6SBarry Smith 171661ecd0c6SBarry Smith if (a->diagonaldense) { 171761ecd0c6SBarry Smith cnt = 0; 171861ecd0c6SBarry Smith } else { 17199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1721349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172261ecd0c6SBarry Smith cnt++; 172361ecd0c6SBarry Smith mdiag[i] = 1; 172461ecd0c6SBarry Smith } 172561ecd0c6SBarry Smith } 172661ecd0c6SBarry Smith } 172761ecd0c6SBarry Smith if (!cnt) { 17289566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 172961ecd0c6SBarry Smith } else { 1730b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1731b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173261ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173361ecd0c6SBarry Smith 173461ecd0c6SBarry Smith a->a = NULL; 173561ecd0c6SBarry Smith a->j = NULL; 173661ecd0c6SBarry Smith a->i = NULL; 173761ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1738ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 174061ecd0c6SBarry Smith 174161ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174261ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17439566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174448a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1745447d62f5SStefano Zampini } 17469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 174861ecd0c6SBarry Smith if (singlemalloc) { 17499566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 175061ecd0c6SBarry Smith } else { 17519566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17529566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17539566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175461ecd0c6SBarry Smith } 175561ecd0c6SBarry Smith } 17569566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 175761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 175861ecd0c6SBarry Smith PetscFunctionReturn(0); 175961ecd0c6SBarry Smith } 176061ecd0c6SBarry Smith 1761be5855fcSBarry Smith /* 1762be5855fcSBarry Smith Checks for missing diagonals 1763be5855fcSBarry Smith */ 1764d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1765d71ae5a4SJacob Faibussowitsch { 1766be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17677734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1768be5855fcSBarry Smith 1769be5855fcSBarry Smith PetscFunctionBegin; 177009f38230SBarry Smith *missing = PETSC_FALSE; 17717734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177209f38230SBarry Smith *missing = PETSC_TRUE; 177309f38230SBarry Smith if (d) *d = 0; 17749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177509f38230SBarry Smith } else { 177601445905SHong Zhang PetscInt n; 177701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1778f1e2ffcdSBarry Smith diag = a->diag; 177901445905SHong Zhang for (i = 0; i < n; i++) { 17807734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178109f38230SBarry Smith *missing = PETSC_TRUE; 178209f38230SBarry Smith if (d) *d = i; 17839566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1784358d2f5dSShri Abhyankar break; 178509f38230SBarry Smith } 1786be5855fcSBarry Smith } 1787be5855fcSBarry Smith } 1788be5855fcSBarry Smith PetscFunctionReturn(0); 1789be5855fcSBarry Smith } 1790be5855fcSBarry Smith 17910da83c2eSBarry Smith #include <petscblaslapack.h> 17920da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17930da83c2eSBarry Smith 17940da83c2eSBarry Smith /* 17950da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17960da83c2eSBarry Smith */ 1797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1798d71ae5a4SJacob Faibussowitsch { 17990da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18000da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18010da83c2eSBarry Smith const PetscReal shift = 0.0; 18020da83c2eSBarry Smith PetscInt ipvt[5]; 1803*4e208921SJed Brown PetscCount flops = 0; 18040da83c2eSBarry Smith PetscScalar work[25], *v_work; 18050da83c2eSBarry Smith 18060da83c2eSBarry Smith PetscFunctionBegin; 18070da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18080da83c2eSBarry 
Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 180908401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1810ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181248a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18130da83c2eSBarry Smith ncnt = 0; 18140da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18150da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18169566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18170da83c2eSBarry Smith switch (bsizes[i]) { 1818d71ae5a4SJacob Faibussowitsch case 1: 1819d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1820d71ae5a4SJacob Faibussowitsch break; 18210da83c2eSBarry Smith case 2: 18229566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18230da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18249566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18250da83c2eSBarry Smith break; 18260da83c2eSBarry Smith case 3: 18279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18280da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18300da83c2eSBarry Smith break; 18310da83c2eSBarry Smith case 4: 18329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18330da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 
18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18350da83c2eSBarry Smith break; 18360da83c2eSBarry Smith case 5: 18379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18380da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18400da83c2eSBarry Smith break; 18410da83c2eSBarry Smith case 6: 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18430da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18450da83c2eSBarry Smith break; 18460da83c2eSBarry Smith case 7: 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18480da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18500da83c2eSBarry Smith break; 18510da83c2eSBarry Smith default: 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18530da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18550da83c2eSBarry Smith } 18560da83c2eSBarry Smith ncnt += bsizes[i]; 18570da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1858*4e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18590da83c2eSBarry Smith } 1860*4e208921SJed Brown PetscLogFlops(flops); 186148a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 
18629566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18630da83c2eSBarry Smith PetscFunctionReturn(0); 18640da83c2eSBarry Smith } 18650da83c2eSBarry Smith 1866422a814eSBarry Smith /* 1867422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1868422a814eSBarry Smith */ 1869d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1870d71ae5a4SJacob Faibussowitsch { 187171f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1872d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18732e5835c6SStefano Zampini const MatScalar *v; 187454f21887SBarry Smith PetscScalar *idiag, *mdiag; 187571f1c65dSBarry Smith 187671f1c65dSBarry Smith PetscFunctionBegin; 187771f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18789566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 187971f1c65dSBarry Smith diag = a->diag; 18804dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18812e5835c6SStefano Zampini 188271f1c65dSBarry Smith mdiag = a->mdiag; 188371f1c65dSBarry Smith idiag = a->idiag; 18849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1885422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 188671f1c65dSBarry Smith for (i = 0; i < m; i++) { 188771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1888899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1889899639b0SHong Zhang if (PetscRealPart(fshift)) { 18909566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18917b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18927b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18937b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189498921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero 
diagonal on row %" PetscInt_FMT, i); 1895899639b0SHong Zhang } 189671f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 189771f1c65dSBarry Smith } 18989566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 189971f1c65dSBarry Smith } else { 190071f1c65dSBarry Smith for (i = 0; i < m; i++) { 190171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 190271f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 190371f1c65dSBarry Smith } 19049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190571f1c65dSBarry Smith } 190671f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 190871f1c65dSBarry Smith PetscFunctionReturn(0); 190971f1c65dSBarry Smith } 191071f1c65dSBarry Smith 1911c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1912d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1913d71ae5a4SJacob Faibussowitsch { 1914416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1915e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19162e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 191754f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19183d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 191997f1f81fSBarry Smith const PetscInt *idx, *diag; 192017ab2063SBarry Smith 19213a40ed3dSBarry Smith PetscFunctionBegin; 1922b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19239566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1924b215bc84SStefano Zampini PetscFunctionReturn(0); 1925b215bc84SStefano Zampini } 1926b965ef7fSBarry Smith its = its * lits; 192791723122SBarry Smith 192871f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19299566063dSJacob 
Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 193071f1c65dSBarry Smith a->fshift = fshift; 193171f1c65dSBarry Smith a->omega = omega; 1932ed480e8bSBarry Smith 193371f1c65dSBarry Smith diag = a->diag; 193471f1c65dSBarry Smith t = a->ssor_work; 1935ed480e8bSBarry Smith idiag = a->idiag; 193671f1c65dSBarry Smith mdiag = a->mdiag; 1937ed480e8bSBarry Smith 19389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19399566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19409566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1941ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 194217ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 194317ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1944ed480e8bSBarry Smith bs = b; 194517ab2063SBarry Smith for (i = 0; i < m; i++) { 194671f1c65dSBarry Smith d = fshift + mdiag[i]; 1947416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1948ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19492e5835c6SStefano Zampini v = aa + diag[i] + 1; 195017ab2063SBarry Smith sum = b[i] * d / omega; 1951003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 195217ab2063SBarry Smith x[i] = sum; 195317ab2063SBarry Smith } 19549566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19559566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19579566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19583a40ed3dSBarry Smith PetscFunctionReturn(0); 195917ab2063SBarry Smith } 1960c783ea89SBarry Smith 196108401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1962f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19634c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower 
triangular, 1964887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196517ab2063SBarry Smith 196617ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 196717ab2063SBarry Smith 1968887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 196917ab2063SBarry Smith */ 197017ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 197117ab2063SBarry Smith 197217ab2063SBarry Smith /* x = (E + U)^{-1} b */ 197317ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1974416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1975ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19762e5835c6SStefano Zampini v = aa + diag[i] + 1; 197717ab2063SBarry Smith sum = b[i]; 1978e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1979ed480e8bSBarry Smith x[i] = sum * idiag[i]; 198017ab2063SBarry Smith } 198117ab2063SBarry Smith 198217ab2063SBarry Smith /* t = b - (2*E - D)x */ 19832e5835c6SStefano Zampini v = aa; 19842205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198517ab2063SBarry Smith 198617ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1987ed480e8bSBarry Smith ts = t; 1988416022c9SBarry Smith diag = a->diag; 198917ab2063SBarry Smith for (i = 0; i < m; i++) { 1990416022c9SBarry Smith n = diag[i] - a->i[i]; 1991ed480e8bSBarry Smith idx = a->j + a->i[i]; 19922e5835c6SStefano Zampini v = aa + a->i[i]; 199317ab2063SBarry Smith sum = t[i]; 1994003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1995ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1996733d66baSBarry Smith /* x = x + t */ 1997733d66baSBarry Smith x[i] += t[i]; 199817ab2063SBarry Smith } 199917ab2063SBarry Smith 20009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20019566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20029566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20033a40ed3dSBarry Smith PetscFunctionReturn(0); 200417ab2063SBarry Smith } 200517ab2063SBarry Smith if (flag & 
SOR_ZERO_INITIAL_GUESS) { 200617ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 200717ab2063SBarry Smith for (i = 0; i < m; i++) { 2008416022c9SBarry Smith n = diag[i] - a->i[i]; 2009ed480e8bSBarry Smith idx = a->j + a->i[i]; 20102e5835c6SStefano Zampini v = aa + a->i[i]; 201117ab2063SBarry Smith sum = b[i]; 2012e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20135c99c7daSBarry Smith t[i] = sum; 2014ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201517ab2063SBarry Smith } 20165c99c7daSBarry Smith xb = t; 20179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20183a40ed3dSBarry Smith } else xb = b; 201917ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 202017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2021416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2022ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20232e5835c6SStefano Zampini v = aa + diag[i] + 1; 202417ab2063SBarry Smith sum = xb[i]; 2025e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20265c99c7daSBarry Smith if (xb == b) { 2027ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20285c99c7daSBarry Smith } else { 2029b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 203017ab2063SBarry Smith } 20315c99c7daSBarry Smith } 20329566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 203317ab2063SBarry Smith } 203417ab2063SBarry Smith its--; 203517ab2063SBarry Smith } 203617ab2063SBarry Smith while (its--) { 203717ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203817ab2063SBarry Smith for (i = 0; i < m; i++) { 2039b19a5dc2SMark Adams /* lower */ 2040b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2041ed480e8bSBarry Smith idx = a->j + a->i[i]; 20422e5835c6SStefano Zampini v = aa + a->i[i]; 204317ab2063SBarry Smith sum = b[i]; 2044e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 
2045b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2046b19a5dc2SMark Adams /* upper */ 2047b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2048b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20492e5835c6SStefano Zampini v = aa + diag[i] + 1; 2050b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2051b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 205217ab2063SBarry Smith } 2053b19a5dc2SMark Adams xb = t; 20549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2055b19a5dc2SMark Adams } else xb = b; 205617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2058b19a5dc2SMark Adams sum = xb[i]; 2059b19a5dc2SMark Adams if (xb == b) { 2060b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2061416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2062ed480e8bSBarry Smith idx = a->j + a->i[i]; 20632e5835c6SStefano Zampini v = aa + a->i[i]; 2064e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2065ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2066b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2067b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2068b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20692e5835c6SStefano Zampini v = aa + diag[i] + 1; 2070b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2071b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207217ab2063SBarry Smith } 2073b19a5dc2SMark Adams } 2074b19a5dc2SMark Adams if (xb == b) { 20759566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2076b19a5dc2SMark Adams } else { 20779566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2078b19a5dc2SMark Adams } 207917ab2063SBarry Smith } 208017ab2063SBarry Smith } 20819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20829566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2084365a8a9eSBarry Smith PetscFunctionReturn(0); 208517ab2063SBarry Smith } 208617ab2063SBarry Smith 2087d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2088d71ae5a4SJacob Faibussowitsch { 2089416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20904e220ebcSLois Curfman McInnes 20913a40ed3dSBarry Smith PetscFunctionBegin; 20924e220ebcSLois Curfman McInnes info->block_size = 1.0; 20933966268fSBarry Smith info->nz_allocated = a->maxnz; 20943966268fSBarry Smith info->nz_used = a->nz; 20953966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20963966268fSBarry Smith info->assemblies = A->num_ass; 20973966268fSBarry Smith info->mallocs = A->info.mallocs; 20984dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2099d5f3da31SBarry Smith if (A->factortype) { 21004e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21014e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21024e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21034e220ebcSLois Curfman McInnes } else { 21044e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21054e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21064e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21074e220ebcSLois Curfman 
McInnes } 21083a40ed3dSBarry Smith PetscFunctionReturn(0); 210917ab2063SBarry Smith } 211017ab2063SBarry Smith 2111d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2112d71ae5a4SJacob Faibussowitsch { 2113416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2114c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211597b48c8fSBarry Smith const PetscScalar *xx; 21162e5835c6SStefano Zampini PetscScalar *bb, *aa; 2117c7da8527SEric Chamberland PetscInt d = 0; 211817ab2063SBarry Smith 21193a40ed3dSBarry Smith PetscFunctionBegin; 212097b48c8fSBarry Smith if (x && b) { 21219566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21229566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 212397b48c8fSBarry Smith for (i = 0; i < N; i++) { 2124aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2125447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 212697b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 212797b48c8fSBarry Smith } 21289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21299566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 213097b48c8fSBarry Smith } 213197b48c8fSBarry Smith 21329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2133a9817697SBarry Smith if (a->keepnonzeropattern) { 2134f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2135aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21369566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2137f1e2ffcdSBarry Smith } 2138f4df32b1SMatthew Knepley if (diag != 0.0) { 2139c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2140c7da8527SEric Chamberland d = rows[i]; 2141447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 214208401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2143c7da8527SEric Chamberland } 2144f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2145447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21462e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2147f1e2ffcdSBarry Smith } 2148f1e2ffcdSBarry Smith } 2149f1e2ffcdSBarry Smith } else { 2150f4df32b1SMatthew Knepley if (diag != 0.0) { 215117ab2063SBarry Smith for (i = 0; i < N; i++) { 2152aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21537ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2154447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2155447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2156447d62f5SStefano Zampini } else { 2157416022c9SBarry Smith a->ilen[rows[i]] = 1; 21582e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2159bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2160447d62f5SStefano Zampini } 2161447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21629566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 216317ab2063SBarry Smith } 216417ab2063SBarry Smith } 21653a40ed3dSBarry Smith } else { 216617ab2063SBarry Smith for (i = 0; i < N; i++) { 2167aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2168416022c9SBarry Smith a->ilen[rows[i]] = 0; 216917ab2063SBarry Smith } 217017ab2063SBarry Smith } 2171e56f5c9eSBarry Smith A->nonzerostate++; 2172f1e2ffcdSBarry Smith } 21739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2174dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21753a40ed3dSBarry Smith PetscFunctionReturn(0); 217617ab2063SBarry Smith } 217717ab2063SBarry Smith 2178d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2179d71ae5a4SJacob Faibussowitsch { 21806e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21816e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21822b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21836e169961SBarry Smith const PetscScalar *xx; 21842e5835c6SStefano Zampini PetscScalar *bb, *aa; 21856e169961SBarry Smith 21866e169961SBarry Smith PetscFunctionBegin; 21872e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21896e169961SBarry Smith if (x && b) { 21909566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21919566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21922b40b63fSBarry Smith vecs = PETSC_TRUE; 21936e169961SBarry Smith } 21949566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21956e169961SBarry Smith for (i = 0; i < N; i++) { 2196aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21979566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 21982205254eSKarl Rupp 21996e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22006e169961SBarry Smith } 22016e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22026e169961SBarry Smith if (!zeroed[i]) { 22036e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22044cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22052e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22062e5835c6SStefano Zampini aa[j] = 0.0; 22076e169961SBarry Smith } 22086e169961SBarry Smith } 22094cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22106e169961SBarry Smith } 22116e169961SBarry Smith if (x && b) { 22129566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22139566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22146e169961SBarry Smith } 22159566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22166e169961SBarry Smith if (diag != 0.0) { 22179566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22181d5a398dSstefano_zampini if (missing) { 22191d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22204cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2221aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22229566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22231d5a398dSstefano_zampini } 22241d5a398dSstefano_zampini } else { 2225ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22266e169961SBarry Smith } 22271d5a398dSstefano_zampini } 22289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2229dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22306e169961SBarry Smith PetscFunctionReturn(0); 22316e169961SBarry Smith } 22326e169961SBarry Smith 2233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2234d71ae5a4SJacob Faibussowitsch { 2235fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2236fff043a9SJunchao Zhang const PetscScalar *aa; 2237fff043a9SJunchao Zhang PetscInt *itmp; 223817ab2063SBarry Smith 22393a40ed3dSBarry Smith PetscFunctionBegin; 22409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2241416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22422e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 224317ab2063SBarry Smith if (idx) { 2244bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224526fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2246f4259b30SLisandro Dalcin else *idx = NULL; 224717ab2063SBarry Smith } 22489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22493a40ed3dSBarry Smith PetscFunctionReturn(0); 225017ab2063SBarry Smith } 225117ab2063SBarry Smith 2252d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2253d71ae5a4SJacob Faibussowitsch { 22543a40ed3dSBarry Smith PetscFunctionBegin; 2255cb4a9cd9SHong Zhang if (nz) *nz = 0; 22562e5835c6SStefano Zampini if (idx) *idx = NULL; 22572e5835c6SStefano Zampini if (v) *v = NULL; 22583a40ed3dSBarry Smith PetscFunctionReturn(0); 225917ab2063SBarry Smith } 226017ab2063SBarry Smith 2261d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2262d71ae5a4SJacob Faibussowitsch { 2263416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22642e5835c6SStefano Zampini const MatScalar *v; 226536db0b34SBarry Smith PetscReal sum = 0.0; 226697f1f81fSBarry Smith PetscInt i, j; 226717ab2063SBarry Smith 22683a40ed3dSBarry Smith PetscFunctionBegin; 22699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227017ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2271570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2272570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2273792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2274570b7f6dSBarry Smith #else 2275416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22769371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22779371c9d4SSatish Balay v++; 227817ab2063SBarry Smith } 22798f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2280570b7f6dSBarry Smith #endif 22819566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22823a40ed3dSBarry Smith } else if (type == NORM_1) { 228336db0b34SBarry Smith PetscReal *tmp; 228497f1f81fSBarry Smith PetscInt *jj = a->j; 22859566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2286064f8208SBarry Smith *nrm = 0.0; 2287416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22889371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22899371c9d4SSatish Balay v++; 229017ab2063SBarry Smith } 2291d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2292064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229317ab2063SBarry Smith } 22949566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22959566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22963a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2297064f8208SBarry Smith *nrm = 0.0; 2298d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22992e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 230017ab2063SBarry Smith sum = 0.0; 2301416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23029371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23039371c9d4SSatish Balay v2++; 230417ab2063SBarry Smith } 2305064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230617ab2063SBarry Smith } 23079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2308f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23103a40ed3dSBarry Smith PetscFunctionReturn(0); 231117ab2063SBarry Smith } 231217ab2063SBarry Smith 2313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2314d71ae5a4SJacob Faibussowitsch { 23153d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231654f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23172e5835c6SStefano Zampini const MatScalar *va, *vb; 
231897f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2319cd0d46ebSvictorle 2320cd0d46ebSvictorle PetscFunctionBegin; 23219566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23229566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23235485867bSBarry Smith if (ma != nb || na != mb) { 23245485867bSBarry Smith *f = PETSC_FALSE; 23255485867bSBarry Smith PetscFunctionReturn(0); 23265485867bSBarry Smith } 23279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23299371c9d4SSatish Balay aii = aij->i; 23309371c9d4SSatish Balay bii = bij->i; 23319371c9d4SSatish Balay adx = aij->j; 23329371c9d4SSatish Balay bdx = bij->j; 23339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2335cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2336cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2337cd0d46ebSvictorle 2338cd0d46ebSvictorle *f = PETSC_TRUE; 2339cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2340cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234197f1f81fSBarry Smith PetscInt idc, idr; 23425485867bSBarry Smith PetscScalar vc, vr; 2343cd0d46ebSvictorle /* column/row index/value */ 23445485867bSBarry Smith idc = adx[aptr[i]]; 23455485867bSBarry Smith idr = bdx[bptr[idc]]; 23465485867bSBarry Smith vc = va[aptr[i]]; 23475485867bSBarry Smith vr = vb[bptr[idc]]; 23485485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23495485867bSBarry Smith *f = PETSC_FALSE; 23505485867bSBarry Smith goto done; 2351cd0d46ebSvictorle } else { 23525485867bSBarry Smith aptr[i]++; 23535485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2354cd0d46ebSvictorle } 2355cd0d46ebSvictorle } 2356cd0d46ebSvictorle } 2357cd0d46ebSvictorle done: 23589566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23599566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2362cd0d46ebSvictorle PetscFunctionReturn(0); 2363cd0d46ebSvictorle } 2364cd0d46ebSvictorle 2365d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2366d71ae5a4SJacob Faibussowitsch { 23673d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236854f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236954f21887SBarry Smith MatScalar *va, *vb; 23701cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23711cbb95d3SBarry Smith 23721cbb95d3SBarry Smith PetscFunctionBegin; 23739566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23749566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23751cbb95d3SBarry Smith if (ma != nb || na != mb) { 23761cbb95d3SBarry Smith *f = PETSC_FALSE; 23771cbb95d3SBarry Smith PetscFunctionReturn(0); 23781cbb95d3SBarry Smith } 23799371c9d4SSatish Balay aii = aij->i; 23809371c9d4SSatish Balay bii = bij->i; 23819371c9d4SSatish Balay adx = aij->j; 23829371c9d4SSatish Balay bdx = bij->j; 23839371c9d4SSatish Balay va = aij->a; 23849371c9d4SSatish Balay vb = bij->a; 23859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23871cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23881cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23891cbb95d3SBarry Smith 23901cbb95d3SBarry Smith *f = PETSC_TRUE; 23911cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23921cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23931cbb95d3SBarry Smith PetscInt idc, idr; 23941cbb95d3SBarry Smith PetscScalar vc, vr; 23951cbb95d3SBarry Smith /* column/row index/value */ 23961cbb95d3SBarry Smith idc = adx[aptr[i]]; 23971cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
23981cbb95d3SBarry Smith vc = va[aptr[i]]; 23991cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24001cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24011cbb95d3SBarry Smith *f = PETSC_FALSE; 24021cbb95d3SBarry Smith goto done; 24031cbb95d3SBarry Smith } else { 24041cbb95d3SBarry Smith aptr[i]++; 24051cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24061cbb95d3SBarry Smith } 24071cbb95d3SBarry Smith } 24081cbb95d3SBarry Smith } 24091cbb95d3SBarry Smith done: 24109566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24119566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24121cbb95d3SBarry Smith PetscFunctionReturn(0); 24131cbb95d3SBarry Smith } 24141cbb95d3SBarry Smith 2415d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2416d71ae5a4SJacob Faibussowitsch { 24179e29f15eSvictorle PetscFunctionBegin; 24189566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24199e29f15eSvictorle PetscFunctionReturn(0); 24209e29f15eSvictorle } 24219e29f15eSvictorle 2422d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2423d71ae5a4SJacob Faibussowitsch { 24241cbb95d3SBarry Smith PetscFunctionBegin; 24259566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24261cbb95d3SBarry Smith PetscFunctionReturn(0); 24271cbb95d3SBarry Smith } 24281cbb95d3SBarry Smith 2429d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2430d71ae5a4SJacob Faibussowitsch { 2431416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2432fff8e43fSBarry Smith const PetscScalar *l, *r; 2433fff8e43fSBarry Smith PetscScalar x; 243454f21887SBarry Smith MatScalar *v; 2435fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2436fff8e43fSBarry Smith const PetscInt *jj; 243717ab2063SBarry Smith 24383a40ed3dSBarry Smith PetscFunctionBegin; 
243917ab2063SBarry Smith if (ll) { 24403ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24413ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24429566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244308401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244617ab2063SBarry Smith for (i = 0; i < m; i++) { 244717ab2063SBarry Smith x = l[i]; 2448416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24492205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 245017ab2063SBarry Smith } 24519566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24529566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245417ab2063SBarry Smith } 245517ab2063SBarry Smith if (rr) { 24569566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245708401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24589566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24602e5835c6SStefano Zampini jj = a->j; 24612205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24649566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246517ab2063SBarry Smith } 24669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24673a40ed3dSBarry Smith PetscFunctionReturn(0); 246817ab2063SBarry Smith } 246917ab2063SBarry Smith 2470d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2471d71ae5a4SJacob Faibussowitsch { 2472db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2473d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247497f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24755d0c19d7SBarry Smith const PetscInt *irow, *icol; 24762e5835c6SStefano Zampini const PetscScalar *aa; 24775d0c19d7SBarry Smith PetscInt nrows, ncols; 247897f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 247954f21887SBarry Smith MatScalar *a_new, *mat_a; 2480416022c9SBarry Smith Mat C; 2481cdc6f3adSToby Isaac PetscBool stride; 248217ab2063SBarry Smith 24833a40ed3dSBarry Smith PetscFunctionBegin; 24849566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24859566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24869566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248717ab2063SBarry Smith 24889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2489ff718158SBarry Smith if (stride) { 24909566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2491ff718158SBarry Smith } else { 2492ff718158SBarry Smith first = 0; 2493ff718158SBarry Smith step = 0; 2494ff718158SBarry Smith } 2495fee21e36SBarry Smith if (stride && step == 1) { 249602834360SBarry Smith /* special case of contiguous rows */ 24979566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249802834360SBarry Smith /* loop over new rows determining lens and starting points */ 249902834360SBarry Smith for (i = 0; i < nrows; i++) { 2500bfeeae90SHong Zhang kstart = ai[irow[i]]; 2501a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2502a91a9bebSLisandro Dalcin starts[i] = kstart; 250302834360SBarry Smith for (k = kstart; k < kend; k++) { 2504bfeeae90SHong Zhang if (aj[k] >= 
first) { 250502834360SBarry Smith starts[i] = k; 250602834360SBarry Smith break; 250702834360SBarry Smith } 250802834360SBarry Smith } 2509a2744918SBarry Smith sum = 0; 251002834360SBarry Smith while (k < kend) { 2511bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2512a2744918SBarry Smith sum++; 251302834360SBarry Smith } 2514a2744918SBarry Smith lens[i] = sum; 251502834360SBarry Smith } 251602834360SBarry Smith /* create submatrix */ 2517cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251897f1f81fSBarry Smith PetscInt n_cols, n_rows; 25199566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2520aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25219566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 252208480c60SBarry Smith C = *B; 25233a40ed3dSBarry Smith } else { 25243bef6203SJed Brown PetscInt rbs, cbs; 25259566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25279566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25289566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25299566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25309566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 253208480c60SBarry Smith } 2533db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2534db02288aSLois Curfman McInnes 253502834360SBarry Smith /* loop over rows inserting into submatrix */ 2536db02288aSLois Curfman McInnes a_new = c->a; 2537db02288aSLois Curfman McInnes j_new = c->j; 2538db02288aSLois Curfman McInnes i_new = c->i; 25399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 254002834360SBarry Smith for (i 
= 0; i < nrows; i++) { 2541a2744918SBarry Smith ii = starts[i]; 2542a2744918SBarry Smith lensi = lens[i]; 2543ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2545a2744918SBarry Smith a_new += lensi; 2546a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2547a2744918SBarry Smith c->ilen[i] = lensi; 254802834360SBarry Smith } 25499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25509566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25513a40ed3dSBarry Smith } else { 25529566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25539566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25554dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25566bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25574dcab191SBarry Smith smap[icol[i]] = i + 1; 25584dcab191SBarry Smith } 25594dcab191SBarry Smith 256002834360SBarry Smith /* determine lens of each row */ 256102834360SBarry Smith for (i = 0; i < nrows; i++) { 2562bfeeae90SHong Zhang kstart = ai[irow[i]]; 256302834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256402834360SBarry Smith lens[i] = 0; 256502834360SBarry Smith for (k = kstart; k < kend; k++) { 2566ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256702834360SBarry Smith } 256802834360SBarry Smith } 256917ab2063SBarry Smith /* Create and fill new matrix */ 2570a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2571ace3abfcSBarry Smith PetscBool equal; 25720f5bd95cSBarry Smith 257399141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2574aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == 
ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25759566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 257628b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257808480c60SBarry Smith C = *B; 25793a40ed3dSBarry Smith } else { 25803bef6203SJed Brown PetscInt rbs, cbs; 25819566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25829566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25839566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25849566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25859566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25869566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258808480c60SBarry Smith } 25899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 259099141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 259117ab2063SBarry Smith for (i = 0; i < nrows; i++) { 259299141d43SSatish Balay row = irow[i]; 2593bfeeae90SHong Zhang kstart = ai[row]; 259499141d43SSatish Balay kend = kstart + a->ilen[row]; 2595bfeeae90SHong Zhang mat_i = c->i[i]; 259699141d43SSatish Balay mat_j = c->j + mat_i; 259799141d43SSatish Balay mat_a = c->a + mat_i; 259899141d43SSatish Balay mat_ilen = c->ilen + i; 259917ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2600bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2601ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26022e5835c6SStefano Zampini *mat_a++ = aa[k]; 260399141d43SSatish Balay (*mat_ilen)++; 260417ab2063SBarry Smith } 260517ab2063SBarry Smith } 260617ab2063SBarry Smith } 26079566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260802834360SBarry Smith /* Free work space */ 26099566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26109566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26119566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2612cdc6f3adSToby Isaac /* sort */ 2613cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2614cdc6f3adSToby Isaac PetscInt ilen; 2615cdc6f3adSToby Isaac 2616cdc6f3adSToby Isaac mat_i = c->i[i]; 2617cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2618cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2619cdc6f3adSToby Isaac ilen = c->ilen[i]; 26209566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2621cdc6f3adSToby Isaac } 262202834360SBarry Smith } 26238c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26249566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2625305c6ccfSStefano Zampini #endif 26269566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26279566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262817ab2063SBarry Smith 26299566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2630416022c9SBarry Smith *B = C; 26313a40ed3dSBarry Smith PetscFunctionReturn(0); 263217ab2063SBarry Smith } 263317ab2063SBarry Smith 2634d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2635d71ae5a4SJacob Faibussowitsch { 263682d44351SHong Zhang Mat B; 263782d44351SHong Zhang 263882d44351SHong Zhang PetscFunctionBegin; 2639c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26409566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26419566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26429566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26439566063dSJacob Faibussowitsch 
PetscCall(MatSetType(B, MATSEQAIJ)); 26449566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264582d44351SHong Zhang *subMat = B; 2646c2d650bdSHong Zhang } else { 26479566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2648c2d650bdSHong Zhang } 264982d44351SHong Zhang PetscFunctionReturn(0); 265082d44351SHong Zhang } 265182d44351SHong Zhang 2652d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2653d71ae5a4SJacob Faibussowitsch { 265463b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265563b91edcSBarry Smith Mat outA; 2656ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265763b91edcSBarry Smith 26583a40ed3dSBarry Smith PetscFunctionBegin; 265908401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26601df811f5SHong Zhang 26619566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26629566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2663a871dcd8SBarry Smith 266463b91edcSBarry Smith outA = inA; 2665d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26669566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26679566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26682205254eSKarl Rupp 26699566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26709566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26712205254eSKarl Rupp 2672c3122656SLisandro Dalcin a->row = row; 26732205254eSKarl Rupp 26749566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26759566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26762205254eSKarl Rupp 2677c3122656SLisandro Dalcin a->col = col; 267863b91edcSBarry Smith 267936db0b34SBarry Smith /* Create the inverse permutation so 
that it can be used in MatLUFactorNumeric() */ 26809566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26819566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2682f0ec6fceSSatish Balay 268394a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268594a9d846SBarry Smith } 268663b91edcSBarry Smith 26879566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2688137fb511SHong Zhang if (row_identity && col_identity) { 26899566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2690137fb511SHong Zhang } else { 26919566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2692137fb511SHong Zhang } 26933a40ed3dSBarry Smith PetscFunctionReturn(0); 2694a871dcd8SBarry Smith } 2695a871dcd8SBarry Smith 2696d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2697d71ae5a4SJacob Faibussowitsch { 2698f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2699dfa0f9e5SStefano Zampini PetscScalar *v; 2700c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27013a40ed3dSBarry Smith 27023a40ed3dSBarry Smith PetscFunctionBegin; 27039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27049566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2705792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27093a40ed3dSBarry Smith PetscFunctionReturn(0); 2710f0b747eeSBarry Smith } 2711f0b747eeSBarry Smith 2712d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 
2713d71ae5a4SJacob Faibussowitsch { 271416b64355SHong Zhang PetscInt i; 271516b64355SHong Zhang 271616b64355SHong Zhang PetscFunctionBegin; 271716b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27189566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271916b64355SHong Zhang 272048a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27219566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272216b64355SHong Zhang 272316b64355SHong Zhang if (submatj->rbuf1) { 27249566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272616b64355SHong Zhang } 272716b64355SHong Zhang 272848a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27299566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27309566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 273116b64355SHong Zhang } 273216b64355SHong Zhang 273316b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27349566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->rmap)); 27359566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27369566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273716b64355SHong Zhang #else 27389566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273916b64355SHong Zhang #endif 274016b64355SHong Zhang 274116b64355SHong Zhang if (!submatj->allcolumns) { 274216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27439566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->cmap)); 274416b64355SHong Zhang #else 27459566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274616b64355SHong 
Zhang #endif 274716b64355SHong Zhang } 27489566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274916b64355SHong Zhang 27509566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 275116b64355SHong Zhang PetscFunctionReturn(0); 275216b64355SHong Zhang } 275316b64355SHong Zhang 2754d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2755d71ae5a4SJacob Faibussowitsch { 275616b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27575c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275816b64355SHong Zhang 275916b64355SHong Zhang PetscFunctionBegin; 27609566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27619566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 276216b64355SHong Zhang PetscFunctionReturn(0); 276316b64355SHong Zhang } 276416b64355SHong Zhang 276589a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2766d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2767d71ae5a4SJacob Faibussowitsch { 27682d033e1fSHong Zhang PetscInt i; 27690fb991dcSHong Zhang Mat C; 27700fb991dcSHong Zhang Mat_SeqAIJ *c; 27710fb991dcSHong Zhang Mat_SubSppt *submatj; 27722d033e1fSHong Zhang 27732d033e1fSHong Zhang PetscFunctionBegin; 27742d033e1fSHong Zhang for (i = 0; i < n; i++) { 27750fb991dcSHong Zhang C = (*mat)[i]; 27760fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27770fb991dcSHong Zhang submatj = c->submatis1; 27782d033e1fSHong Zhang if (submatj) { 2779682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278026cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27819566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27829566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27839566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27843faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27859566063dSJacob 
Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27869566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27879566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2788682e4c99SStefano Zampini } 27892d033e1fSHong Zhang } else { 27909566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27912d033e1fSHong Zhang } 27922d033e1fSHong Zhang } 279386e85357SHong Zhang 279463a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27959566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279663a75b2aSHong Zhang 27979566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27982d033e1fSHong Zhang PetscFunctionReturn(0); 27992d033e1fSHong Zhang } 28002d033e1fSHong Zhang 2801d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2802d71ae5a4SJacob Faibussowitsch { 280397f1f81fSBarry Smith PetscInt i; 2804cddf8d76SBarry Smith 28053a40ed3dSBarry Smith PetscFunctionBegin; 280648a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2807cddf8d76SBarry Smith 280848a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28093a40ed3dSBarry Smith PetscFunctionReturn(0); 2810cddf8d76SBarry Smith } 2811cddf8d76SBarry Smith 2812d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2813d71ae5a4SJacob Faibussowitsch { 2814e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28159a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28165d0c19d7SBarry Smith const PetscInt *idx; 28179a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? 
A->rmap->bs : 1; 2818f1af5d2fSBarry Smith PetscBT table; 2819bbd702dbSSatish Balay 28203a40ed3dSBarry Smith PetscFunctionBegin; 28219a88ca10SBarry Smith m = A->rmap->n / bs; 2822e4d965acSSatish Balay ai = a->i; 2823bfeeae90SHong Zhang aj = a->j; 28248a047759SSatish Balay 282508401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282606763907SSatish Balay 28279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28289566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282906763907SSatish Balay 2830e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2831b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2832e4d965acSSatish Balay isz = 0; 28339566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2834e4d965acSSatish Balay 2835e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28369566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28379566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2838e4d965acSSatish Balay 28399a88ca10SBarry Smith if (bs > 1) { 28409a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28419a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28429a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28439a88ca10SBarry Smith } 28449a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28459a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28469a88ca10SBarry Smith 28479a88ca10SBarry Smith k = 0; 28489a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28499a88ca10SBarry Smith n = isz; 28509a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28519a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28529a88ca10SBarry Smith row = bs * nidx[k] + ll; 28539a88ca10SBarry Smith start = ai[row]; 28549a88ca10SBarry Smith end = ai[row + 1]; 28559a88ca10SBarry Smith for (l = start; l < end; l++) { 28569a88ca10SBarry Smith val = aj[l] / bs; 28579a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28589a88ca10SBarry Smith } 28599a88ca10SBarry Smith } 28609a88ca10SBarry Smith } 28619a88ca10SBarry Smith } 28629a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28639a88ca10SBarry Smith } else { 2864dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2865e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28662205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28674dcbc457SBarry Smith } 28689566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28699566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2870e4d965acSSatish Balay 287104a348a9SBarry Smith k = 0; 287204a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287304a348a9SBarry Smith n = isz; 287406763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2875e4d965acSSatish Balay row = nidx[k]; 2876e4d965acSSatish Balay start = ai[row]; 2877e4d965acSSatish Balay end = ai[row + 1]; 287804a348a9SBarry Smith for (l = start; l < end; l++) { 2879efb16452SHong Zhang val = aj[l]; 28802205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2881e4d965acSSatish Balay } 2882e4d965acSSatish Balay } 2883e4d965acSSatish Balay } 28849566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2885e4d965acSSatish Balay } 28869a88ca10SBarry Smith } 28879566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28889566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28893a40ed3dSBarry Smith PetscFunctionReturn(0); 28904dcbc457SBarry Smith } 289117ab2063SBarry Smith 28920513a670SBarry Smith /* -------------------------------------------------------------- */ 2893d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2894d71ae5a4SJacob Faibussowitsch { 28950513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28963b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28975d0c19d7SBarry Smith const PetscInt *row, *col; 28985d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 289956cd22aeSBarry Smith IS icolp, irowp; 29000298fd71SBarry Smith PetscInt *cwork = NULL; 
29010298fd71SBarry Smith PetscScalar *vwork = NULL; 29020513a670SBarry Smith 29033a40ed3dSBarry Smith PetscFunctionBegin; 29049566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29059566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29069566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29079566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29080513a670SBarry Smith 29090513a670SBarry Smith /* determine lengths of permuted rows */ 29109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29112205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29129566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29139566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29149566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29159566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29179566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29180513a670SBarry Smith 29199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29200513a670SBarry Smith for (i = 0; i < m; i++) { 29219566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29222205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29239566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29249566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29250513a670SBarry Smith } 29269566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29272205254eSKarl Rupp 29283c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29292205254eSKarl Rupp 29308c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29319566063dSJacob Faibussowitsch 
PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29329fe5e383SStefano Zampini #endif 29339566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29349566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29359566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29369566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29379566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29389566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 293948a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29403a40ed3dSBarry Smith PetscFunctionReturn(0); 29410513a670SBarry Smith } 29420513a670SBarry Smith 2943d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2944d71ae5a4SJacob Faibussowitsch { 2945cb5b572fSBarry Smith PetscFunctionBegin; 294633f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 294733f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2948be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2949be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29502e5835c6SStefano Zampini const PetscScalar *aa; 2951be6bf707SBarry Smith 29529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295308401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29549566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29559566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2957cb5b572fSBarry Smith } else { 29589566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2959cb5b572fSBarry Smith } 2960cb5b572fSBarry Smith PetscFunctionReturn(0); 2961cb5b572fSBarry Smith } 2962cb5b572fSBarry Smith 2963d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2964d71ae5a4SJacob Faibussowitsch { 2965273d9f13SBarry Smith PetscFunctionBegin; 29669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2967273d9f13SBarry Smith PetscFunctionReturn(0); 2968273d9f13SBarry Smith } 2969273d9f13SBarry Smith 2970d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2971d71ae5a4SJacob Faibussowitsch { 29726c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29736e111a19SKarl Rupp 29746c0721eeSBarry Smith PetscFunctionBegin; 29756c0721eeSBarry Smith *array = a->a; 29766c0721eeSBarry Smith PetscFunctionReturn(0); 29776c0721eeSBarry Smith } 29786c0721eeSBarry Smith 2979d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2980d71ae5a4SJacob Faibussowitsch { 29816c0721eeSBarry Smith PetscFunctionBegin; 2982f38c1e66SStefano Zampini *array = NULL; 29836c0721eeSBarry Smith PetscFunctionReturn(0); 29846c0721eeSBarry Smith } 2985273d9f13SBarry Smith 29868229c054SShri Abhyankar /* 29878229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29888229c054SShri Abhyankar have different nonzero structure. 29898229c054SShri Abhyankar */ 2990d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2991d71ae5a4SJacob Faibussowitsch { 2992b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2993ec7775f6SShri Abhyankar 2994ec7775f6SShri Abhyankar PetscFunctionBegin; 2995ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2996ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 2997b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 2998b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2999b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30008af7cee1SJed Brown nnz[i] = 0; 30018af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3002b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3003b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30048af7cee1SJed Brown nnz[i]++; 30058af7cee1SJed Brown } 30068af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3007ec7775f6SShri Abhyankar } 3008ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3009ec7775f6SShri Abhyankar } 3010ec7775f6SShri Abhyankar 3011d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3012d71ae5a4SJacob Faibussowitsch { 3013b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3014b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3015b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 3016b264fe52SHong Zhang 3017b264fe52SHong Zhang PetscFunctionBegin; 3018b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30199566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 3020b264fe52SHong Zhang PetscFunctionReturn(0); 3021b264fe52SHong Zhang } 3022b264fe52SHong Zhang 3023d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3024d71ae5a4SJacob Faibussowitsch { 3025ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3026ac90fabeSBarry Smith 3027ac90fabeSBarry Smith PetscFunctionBegin; 3028134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3029134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3030134adf20SPierre Jolivet if (e) { 30319566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 303281fa06acSBarry Smith if (e) { 30339566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3034134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303581fa06acSBarry Smith } 303681fa06acSBarry Smith } 303754c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303881fa06acSBarry Smith } 3039ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30402e5835c6SStefano Zampini const PetscScalar *xa; 30412e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 304281fa06acSBarry Smith PetscBLASInt one = 1, bnz; 304381fa06acSBarry Smith 30449566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3047792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30509566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30529566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3053ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30549566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3055ac90fabeSBarry Smith } else { 30568229c054SShri Abhyankar Mat B; 30578229c054SShri Abhyankar PetscInt *nnz; 30589566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30599566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30609566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30619566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30629566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30639566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30659566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30669566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30679bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30689566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3069ac90fabeSBarry Smith } 3070ac90fabeSBarry Smith PetscFunctionReturn(0); 3071ac90fabeSBarry Smith } 3072ac90fabeSBarry Smith 3073d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3074d71ae5a4SJacob Faibussowitsch { 3075354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3076354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3077354c94deSBarry Smith 
PetscInt i, nz; 3078354c94deSBarry Smith PetscScalar *a; 3079354c94deSBarry Smith 3080354c94deSBarry Smith PetscFunctionBegin; 3081354c94deSBarry Smith nz = aij->nz; 30829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30832205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3085354c94deSBarry Smith #else 3086354c94deSBarry Smith PetscFunctionBegin; 3087354c94deSBarry Smith #endif 3088354c94deSBarry Smith PetscFunctionReturn(0); 3089354c94deSBarry Smith } 3090354c94deSBarry Smith 3091d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3092d71ae5a4SJacob Faibussowitsch { 3093e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3094d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3095e34fafa9SBarry Smith PetscReal atmp; 3096985db425SBarry Smith PetscScalar *x; 3097ce496241SStefano Zampini const MatScalar *aa, *av; 3098e34fafa9SBarry Smith 3099e34fafa9SBarry Smith PetscFunctionBegin; 310028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3102ce496241SStefano Zampini aa = av; 3103e34fafa9SBarry Smith ai = a->i; 3104e34fafa9SBarry Smith aj = a->j; 3105e34fafa9SBarry Smith 31069566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31079566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31089566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 310908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3110e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31119371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31129371c9d4SSatish Balay ai++; 3113e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3114985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
31159371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31169371c9d4SSatish Balay x[i] = atmp; 31179371c9d4SSatish Balay if (idx) idx[i] = *aj; 31189371c9d4SSatish Balay } 31199371c9d4SSatish Balay aa++; 31209371c9d4SSatish Balay aj++; 3121985db425SBarry Smith } 3122985db425SBarry Smith } 31239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3125985db425SBarry Smith PetscFunctionReturn(0); 3126985db425SBarry Smith } 3127985db425SBarry Smith 3128d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3129d71ae5a4SJacob Faibussowitsch { 3130985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3131d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3132985db425SBarry Smith PetscScalar *x; 3133ce496241SStefano Zampini const MatScalar *aa, *av; 3134985db425SBarry Smith 3135985db425SBarry Smith PetscFunctionBegin; 313628b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3138ce496241SStefano Zampini aa = av; 3139985db425SBarry Smith ai = a->i; 3140985db425SBarry Smith aj = a->j; 3141985db425SBarry Smith 31429566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31439566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31449566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 314508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3146985db425SBarry Smith for (i = 0; i < m; i++) { 31479371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31489371c9d4SSatish Balay ai++; 3149d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31509371c9d4SSatish Balay x[i] = *aa; 31519371c9d4SSatish Balay if (idx) idx[i] = 0; 3152985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3153985db425SBarry Smith x[i] = 0.0; 3154985db425SBarry Smith if (idx) { 3155985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3156985db425SBarry Smith if (aj[j] > j) { 3157985db425SBarry Smith idx[i] = j; 3158985db425SBarry Smith break; 3159985db425SBarry Smith } 3160985db425SBarry Smith } 31611a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31621a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3163985db425SBarry Smith } 3164985db425SBarry Smith } 3165985db425SBarry Smith for (j = 0; j < ncols; j++) { 31669371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31679371c9d4SSatish Balay x[i] = *aa; 31689371c9d4SSatish Balay if (idx) idx[i] = *aj; 31699371c9d4SSatish Balay } 31709371c9d4SSatish Balay aa++; 31719371c9d4SSatish Balay aj++; 3172985db425SBarry Smith } 3173985db425SBarry Smith } 31749566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3176985db425SBarry Smith PetscFunctionReturn(0); 3177985db425SBarry Smith } 3178985db425SBarry Smith 3179d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3180d71ae5a4SJacob Faibussowitsch { 3181c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3182c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3183ce496241SStefano Zampini PetscScalar *x; 3184ce496241SStefano Zampini const MatScalar *aa, *av; 3185c87e5d42SMatthew Knepley 3186c87e5d42SMatthew Knepley PetscFunctionBegin; 31879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3188ce496241SStefano Zampini aa = av; 3189c87e5d42SMatthew Knepley ai = a->i; 3190c87e5d42SMatthew Knepley aj = a->j; 3191c87e5d42SMatthew Knepley 31929566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31939566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31949566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 319508401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3196c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31979371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31989371c9d4SSatish Balay ai++; 3199f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32009371c9d4SSatish Balay x[i] = *aa; 32019371c9d4SSatish Balay if (idx) idx[i] = 0; 3202f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3203f07e67edSHong Zhang x[i] = 0.0; 3204f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3205289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3206f07e67edSHong Zhang if (aj[j] > j) { 3207f07e67edSHong Zhang idx[i] = j; 32082205254eSKarl Rupp break; 32092205254eSKarl Rupp } 3210289a08f5SMatthew Knepley } 3211f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3212f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3213f07e67edSHong Zhang } 3214289a08f5SMatthew Knepley } 3215c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32169371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32179371c9d4SSatish Balay x[i] = *aa; 32189371c9d4SSatish Balay if (idx) idx[i] = *aj; 32199371c9d4SSatish Balay } 32209371c9d4SSatish Balay aa++; 32219371c9d4SSatish Balay aj++; 3222c87e5d42SMatthew Knepley } 3223c87e5d42SMatthew Knepley } 32249566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3226c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3227c87e5d42SMatthew Knepley } 3228c87e5d42SMatthew Knepley 3229d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3230d71ae5a4SJacob 
Faibussowitsch { 3231985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3232d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3233d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3234985db425SBarry Smith PetscScalar *x; 3235ce496241SStefano Zampini const MatScalar *aa, *av; 3236985db425SBarry Smith 3237985db425SBarry Smith PetscFunctionBegin; 323828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3240ce496241SStefano Zampini aa = av; 3241985db425SBarry Smith ai = a->i; 3242985db425SBarry Smith aj = a->j; 3243985db425SBarry Smith 32449566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32459566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32469566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 324708401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3248985db425SBarry Smith for (i = 0; i < m; i++) { 32499371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32509371c9d4SSatish Balay ai++; 3251d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32529371c9d4SSatish Balay x[i] = *aa; 32539371c9d4SSatish Balay if (idx) idx[i] = 0; 3254985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3255985db425SBarry Smith x[i] = 0.0; 3256985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3257985db425SBarry Smith for (j = 0; j < ncols; j++) { 3258985db425SBarry Smith if (aj[j] > j) { 3259985db425SBarry Smith idx[i] = j; 3260985db425SBarry Smith break; 3261985db425SBarry Smith } 3262985db425SBarry Smith } 3263fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3264fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3265985db425SBarry Smith } 3266985db425SBarry Smith } 3267985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32689371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32699371c9d4SSatish Balay x[i] = *aa; 32709371c9d4SSatish Balay if (idx) idx[i] = *aj; 32719371c9d4SSatish Balay } 32729371c9d4SSatish Balay aa++; 32739371c9d4SSatish Balay aj++; 3274e34fafa9SBarry Smith } 3275e34fafa9SBarry Smith } 32769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3278e34fafa9SBarry Smith PetscFunctionReturn(0); 3279e34fafa9SBarry Smith } 3280bbead8a2SBarry Smith 3281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3282d71ae5a4SJacob Faibussowitsch { 3283bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 328433d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3285bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32860da83c2eSBarry Smith const PetscReal shift = 0.0; 32871a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3288bbead8a2SBarry Smith 3289bbead8a2SBarry Smith PetscFunctionBegin; 3290a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32914a0d0026SBarry Smith if (a->ibdiagvalid) { 32924a0d0026SBarry Smith if (values) *values = a->ibdiag; 32934a0d0026SBarry Smith PetscFunctionReturn(0); 32944a0d0026SBarry Smith } 32959566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 32964dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3297bbead8a2SBarry Smith diag = a->ibdiag; 3298bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3299bbead8a2SBarry Smith /* factor and invert each block */ 3300bbead8a2SBarry Smith switch (bs) { 3301bbead8a2SBarry Smith case 1: 3302bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33039566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3304ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3305ec1892c8SHong Zhang if (allowzeropivot) { 33067b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33077b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33087b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33099566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 331098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3311ec1892c8SHong Zhang } 3312bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3313bbead8a2SBarry Smith } 3314bbead8a2SBarry Smith break; 3315bbead8a2SBarry Smith case 2: 3316bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33179371c9d4SSatish Balay ij[0] = 2 * i; 33189371c9d4SSatish Balay ij[1] = 2 * i + 1; 33199566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33209566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33217b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33229566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3323bbead8a2SBarry Smith diag += 4; 3324bbead8a2SBarry Smith } 3325bbead8a2SBarry Smith break; 3326bbead8a2SBarry Smith case 3: 3327bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33289371c9d4SSatish Balay ij[0] = 3 * i; 33299371c9d4SSatish Balay ij[1] = 3 * i + 1; 33309371c9d4SSatish Balay ij[2] = 3 * i + 2; 33319566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33337b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3335bbead8a2SBarry Smith diag += 9; 3336bbead8a2SBarry Smith } 3337bbead8a2SBarry Smith break; 3338bbead8a2SBarry Smith case 4: 3339bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33409371c9d4SSatish Balay ij[0] = 4 * i; 33419371c9d4SSatish Balay ij[1] = 4 * i + 1; 33429371c9d4SSatish Balay ij[2] = 4 * i + 2; 33439371c9d4SSatish Balay ij[3] = 4 * i + 3; 33449566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33467b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3348bbead8a2SBarry Smith diag += 16; 3349bbead8a2SBarry Smith } 3350bbead8a2SBarry Smith break; 3351bbead8a2SBarry Smith case 5: 3352bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33539371c9d4SSatish Balay ij[0] = 5 * i; 33549371c9d4SSatish Balay ij[1] = 5 * i + 1; 33559371c9d4SSatish Balay ij[2] = 5 * i + 2; 33569371c9d4SSatish Balay ij[3] = 5 * i + 3; 33579371c9d4SSatish Balay ij[4] = 5 * i + 4; 33589566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33607b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3362bbead8a2SBarry Smith diag += 25; 3363bbead8a2SBarry Smith } 3364bbead8a2SBarry Smith break; 3365bbead8a2SBarry Smith case 6: 3366bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33679371c9d4SSatish Balay ij[0] = 6 * i; 33689371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33699371c9d4SSatish Balay ij[2] = 6 * i + 2; 33709371c9d4SSatish Balay ij[3] = 6 * i + 3; 33719371c9d4SSatish Balay ij[4] = 6 * i + 4; 33729371c9d4SSatish Balay ij[5] = 6 * i + 5; 33739566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33757b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33769566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3377bbead8a2SBarry Smith diag += 36; 3378bbead8a2SBarry Smith } 3379bbead8a2SBarry Smith break; 3380bbead8a2SBarry Smith case 7: 3381bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33829371c9d4SSatish Balay ij[0] = 7 * i; 33839371c9d4SSatish Balay ij[1] = 7 * i + 1; 33849371c9d4SSatish Balay ij[2] = 7 * i + 2; 33859371c9d4SSatish Balay ij[3] = 7 * i + 3; 33869371c9d4SSatish Balay ij[4] = 7 * i + 4; 33879371c9d4SSatish Balay ij[5] = 7 * i + 5; 33889371c9d4SSatish Balay ij[5] = 7 * i + 6; 33899566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33909566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33917b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33929566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3393bbead8a2SBarry Smith diag += 49; 3394bbead8a2SBarry Smith } 3395bbead8a2SBarry Smith break; 3396bbead8a2SBarry Smith default: 33979566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3398bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3399ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34009566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34019566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, 
v_work, allowzeropivot, &zeropivotdetected)); 34027b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34039566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3404bbead8a2SBarry Smith diag += bs2; 3405bbead8a2SBarry Smith } 34069566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3407bbead8a2SBarry Smith } 3408bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3409bbead8a2SBarry Smith PetscFunctionReturn(0); 3410bbead8a2SBarry Smith } 3411bbead8a2SBarry Smith 3412d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3413d71ae5a4SJacob Faibussowitsch { 341473a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3415fff043a9SJunchao Zhang PetscScalar a, *aa; 341673a71a0fSBarry Smith PetscInt m, n, i, j, col; 341773a71a0fSBarry Smith 341873a71a0fSBarry Smith PetscFunctionBegin; 341973a71a0fSBarry Smith if (!x->assembled) { 34209566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 342173a71a0fSBarry Smith for (i = 0; i < m; i++) { 342273a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34239566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 342473a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34259566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 342673a71a0fSBarry Smith } 342773a71a0fSBarry Smith } 3428e2ce353bSJunchao Zhang } else { 34299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34309566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3432e2ce353bSJunchao Zhang } 34339566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34349566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 343573a71a0fSBarry Smith PetscFunctionReturn(0); 
343673a71a0fSBarry Smith } 343773a71a0fSBarry Smith 3438679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3439d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3440d71ae5a4SJacob Faibussowitsch { 3441679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3442679944adSJunchao Zhang PetscScalar a; 3443679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3444679944adSJunchao Zhang 3445679944adSJunchao Zhang PetscFunctionBegin; 3446679944adSJunchao Zhang nskip = high - low; 34479566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3448679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3449679944adSJunchao Zhang for (i = 0; i < m; i++) { 3450679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34519566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3452679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3453679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34549566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3455679944adSJunchao Zhang } 3456e2ce353bSJunchao Zhang } 34579566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34589566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 3459679944adSJunchao Zhang PetscFunctionReturn(0); 3460679944adSJunchao Zhang } 3461679944adSJunchao Zhang 3462682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34630a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3464cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3465cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3466cb5b572fSBarry Smith MatMult_SeqAIJ, 346797304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34687c922b88SBarry Smith 
MatMultTranspose_SeqAIJ, 34697c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3470f4259b30SLisandro Dalcin NULL, 3471f4259b30SLisandro Dalcin NULL, 3472f4259b30SLisandro Dalcin NULL, 3473f4259b30SLisandro Dalcin /* 10*/ NULL, 3474cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3475f4259b30SLisandro Dalcin NULL, 347641f059aeSBarry Smith MatSOR_SeqAIJ, 347791e9d3e2SHong Zhang MatTranspose_SeqAIJ, 347897304618SKris Buschelman /* 15*/ MatGetInfo_SeqAIJ, 3479cb5b572fSBarry Smith MatEqual_SeqAIJ, 3480cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3481cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3482cb5b572fSBarry Smith MatNorm_SeqAIJ, 3483f4259b30SLisandro Dalcin /* 20*/ NULL, 3484cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3485cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3486cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3487d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3488f4259b30SLisandro Dalcin NULL, 3489f4259b30SLisandro Dalcin NULL, 3490f4259b30SLisandro Dalcin NULL, 3491f4259b30SLisandro Dalcin NULL, 34924994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3493f4259b30SLisandro Dalcin NULL, 3494f4259b30SLisandro Dalcin NULL, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin NULL, 3497d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3498f4259b30SLisandro Dalcin NULL, 3499f4259b30SLisandro Dalcin NULL, 3500cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3501f4259b30SLisandro Dalcin NULL, 3502d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35037dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3504cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3505cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3506cb5b572fSBarry Smith MatCopy_SeqAIJ, 3507d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3508cb5b572fSBarry Smith MatScale_SeqAIJ, 35097d68702bSBarry Smith MatShift_SeqAIJ, 351079299369SBarry Smith MatDiagonalSet_SeqAIJ, 35116e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 351273a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35133b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 
35143b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35153b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3516a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 351793dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520cda55fadSBarry Smith MatPermute_SeqAIJ, 3521f4259b30SLisandro Dalcin NULL, 3522f4259b30SLisandro Dalcin /* 59*/ NULL, 3523b9b97703SBarry Smith MatDestroy_SeqAIJ, 3524b9b97703SBarry Smith MatView_SeqAIJ, 3525f4259b30SLisandro Dalcin NULL, 3526f4259b30SLisandro Dalcin NULL, 3527f4259b30SLisandro Dalcin /* 64*/ NULL, 3528321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3529f4259b30SLisandro Dalcin NULL, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin NULL, 3532d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3533c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3534f4259b30SLisandro Dalcin NULL, 3535f4259b30SLisandro Dalcin NULL, 3536f4259b30SLisandro Dalcin NULL, 3537f4259b30SLisandro Dalcin /* 74*/ NULL, 35383acb8795SBarry Smith MatFDColoringApply_AIJ, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin NULL, 35426ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 3546bc011b1eSHong Zhang MatLoad_SeqAIJ, 3547d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35481cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin NULL, 3552f4259b30SLisandro Dalcin /* 89*/ NULL, 3553f4259b30SLisandro Dalcin NULL, 355426be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin NULL, 35578fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 35606fc122caSHong Zhang 
MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3561f4259b30SLisandro Dalcin NULL, 35624222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 356587d4246cSBarry Smith MatConjugate_SeqAIJ, 3566f4259b30SLisandro Dalcin NULL, 3567d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 356899cafbc1SBarry Smith MatRealPart_SeqAIJ, 3569f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3570f4259b30SLisandro Dalcin NULL, 3571f4259b30SLisandro Dalcin NULL, 3572cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3573f4259b30SLisandro Dalcin NULL, 35742af78befSBarry Smith MatGetRowMin_SeqAIJ, 3575f4259b30SLisandro Dalcin NULL, 3576599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3577f4259b30SLisandro Dalcin /*114*/ NULL, 3578f4259b30SLisandro Dalcin NULL, 3579f4259b30SLisandro Dalcin NULL, 3580f4259b30SLisandro Dalcin NULL, 3581f4259b30SLisandro Dalcin NULL, 3582f4259b30SLisandro Dalcin /*119*/ NULL, 3583f4259b30SLisandro Dalcin NULL, 3584f4259b30SLisandro Dalcin NULL, 3585f4259b30SLisandro Dalcin NULL, 3586b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35870716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3588a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 358937868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35900da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3591f4259b30SLisandro Dalcin NULL, 3592f4259b30SLisandro Dalcin /*129*/ NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 359575648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3596b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3597b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 35982b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3599f4259b30SLisandro Dalcin NULL, 3600f4259b30SLisandro Dalcin NULL, 36013964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3602f4259b30SLisandro Dalcin /*139*/ NULL, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin 
NULL, 36053a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36069c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36074222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36084222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3609f4259b30SLisandro Dalcin NULL, 361072833a62Smarkadams4 NULL, 361172833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36122d776b49SBarry Smith NULL, 36139371c9d4SSatish Balay /*150*/ MatTransposeSymbolic_SeqAIJ}; 361417ab2063SBarry Smith /* MatSeqAIJSetColumnIndices_SeqAIJ - copies aij->maxnz entries from indices[] into aij->j, sets aij->nz to aij->maxnz, and sets each row's ilen[i] to its imax[i]. No bounds or ordering checks are performed on indices[]. */ 3615d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3616d71ae5a4SJacob Faibussowitsch { 3617bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 361897f1f81fSBarry Smith PetscInt i, nz, n; 3619bef8e0ddSBarry Smith 3620bef8e0ddSBarry Smith PetscFunctionBegin; 3621bef8e0ddSBarry Smith nz = aij->maxnz; 3622d0f46423SBarry Smith n = mat->rmap->n; 3623ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3624bef8e0ddSBarry Smith aij->nz = nz; 3625ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 3626bef8e0ddSBarry Smith PetscFunctionReturn(0); 3627bef8e0ddSBarry Smith } 3628bef8e0ddSBarry Smith 3629a3bb6f32SFande Kong /* 3630ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3631ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3632ddea5d60SJunchao Zhang */ 3633d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3634d71ae5a4SJacob Faibussowitsch { 3635a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3636a3bb6f32SFande Kong PetscTable gid1_lid1; 3637a3bb6f32SFande Kong PetscTablePosition tpos; 363825b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 363925b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3640a3bb6f32SFande Kong 3641a3bb6f32SFande Kong PetscFunctionBegin; 3642a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3643a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3644a3bb6f32SFande Kong /* use a table */ 36459566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n, mat->cmap->N + 1, &gid1_lid1)); 3646a3bb6f32SFande Kong ec = 0; 364725b670f0SStefano Zampini for (i = 0; i < nz; i++) { 364825b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 36499566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &data)); 3650a3bb6f32SFande Kong if (!data) { 3651a3bb6f32SFande Kong /* one based table */ 36529566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1, gid1, ++ec, INSERT_VALUES)); 3653a3bb6f32SFande Kong } 3654a3bb6f32SFande Kong } 3655a3bb6f32SFande Kong /* form array of columns we need */ 36569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 36579566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1, &tpos)); 3658a3bb6f32SFande Kong while (tpos) { 36599566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1, &tpos, &gid, &lid)); 3660a3bb6f32SFande Kong gid--; 3661a3bb6f32SFande Kong lid--; 3662a3bb6f32SFande Kong garray[lid] = gid; 3663a3bb6f32SFande Kong } 36649566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* 
sort, and rebuild */ 36659566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 366648a46eb9SPierre Jolivet for (i = 0; i < ec; i++) PetscCall(PetscTableAdd(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES)); 3667a3bb6f32SFande Kong /* compact out the extra columns in B */ 366825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 366925b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36709566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &lid)); 3671a3bb6f32SFande Kong lid--; 367225b670f0SStefano Zampini jj[i] = lid; 3673a3bb6f32SFande Kong } 36749566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36759566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36769566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36779566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36789566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3679a3bb6f32SFande Kong PetscFunctionReturn(0); 3680a3bb6f32SFande Kong } 3681a3bb6f32SFande Kong 3682bef8e0ddSBarry Smith /*@ 3683bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3684bef8e0ddSBarry Smith in the matrix. 3685bef8e0ddSBarry Smith 3686bef8e0ddSBarry Smith Input Parameters: 368711a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3688bef8e0ddSBarry Smith - indices - the column indices 3689bef8e0ddSBarry Smith 369015091d37SBarry Smith Level: advanced 369115091d37SBarry Smith 3692bef8e0ddSBarry Smith Notes: 3693bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3694bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 369511a5261eSBarry Smith of the `MatSetValues()` operation. 
3696bef8e0ddSBarry Smith 3697bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 369811a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3699bef8e0ddSBarry Smith 370011a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3701bef8e0ddSBarry Smith 3702b9617806SBarry Smith The indices should start with zero, not one. 3703b9617806SBarry Smith 3704bef8e0ddSBarry Smith @*/ 3705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3706d71ae5a4SJacob Faibussowitsch { 3707bef8e0ddSBarry Smith PetscFunctionBegin; 37080700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3709dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3710cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3711bef8e0ddSBarry Smith PetscFunctionReturn(0); 3712bef8e0ddSBarry Smith } 3713bef8e0ddSBarry Smith 3714be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3715be6bf707SBarry Smith 3716d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3717d71ae5a4SJacob Faibussowitsch { 3718be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3719d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3720be6bf707SBarry Smith 3721be6bf707SBarry Smith PetscFunctionBegin; 372228b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3723be6bf707SBarry Smith 3724be6bf707SBarry Smith /* allocate space for values if not already there */ 37254dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3726be6bf707SBarry Smith 3727be6bf707SBarry Smith /* copy values over */ 37289566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, 
nz)); 3729be6bf707SBarry Smith PetscFunctionReturn(0); 3730be6bf707SBarry Smith } 3731be6bf707SBarry Smith 3732be6bf707SBarry Smith /*@ 3733be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3734be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3735be6bf707SBarry Smith nonlinear portion. 3736be6bf707SBarry Smith 3737c3339decSBarry Smith Logically Collective 3738be6bf707SBarry Smith 3739be6bf707SBarry Smith Input Parameter: 374011a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3741be6bf707SBarry Smith 374215091d37SBarry Smith Level: advanced 374315091d37SBarry Smith 374411a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3745be6bf707SBarry Smith $ Create Jacobian matrix 3746be6bf707SBarry Smith $ Set linear terms into matrix 3747be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3748be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3749be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure) 3750512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3751be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3752be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3753be6bf707SBarry Smith $ In your Jacobian routine 3754be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3755be6bf707SBarry Smith $ Set nonlinear terms in matrix 3756be6bf707SBarry Smith 3757be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. 
when you handle nonlinear solve yourself: 3758be6bf707SBarry Smith $ // build linear portion of Jacobian 3759512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3760be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3761be6bf707SBarry Smith $ loop over nonlinear iterations 3762be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3763be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 3764be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3765be6bf707SBarry Smith $ Solve linear system with Jacobian 3766be6bf707SBarry Smith $ endloop 3767be6bf707SBarry Smith 3768be6bf707SBarry Smith Notes: 3769be6bf707SBarry Smith Matrix must already be assembled before calling this routine. 377011a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3771be6bf707SBarry Smith calling this routine. 3772be6bf707SBarry Smith 37730c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37740c468ba9SBarry Smith and does not allocate additional space. 
37750c468ba9SBarry Smith 3776db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3777be6bf707SBarry Smith @*/ 3778d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3779d71ae5a4SJacob Faibussowitsch { 3780be6bf707SBarry Smith PetscFunctionBegin; 37810700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 378228b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 378328b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3784cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3785be6bf707SBarry Smith PetscFunctionReturn(0); 3786be6bf707SBarry Smith } 3787be6bf707SBarry Smith /* MatRetrieveValues_SeqAIJ - copies the first aij->i[mat->rmap->n] entries of aij->saved_values back into aij->a. Fails with PETSC_ERR_ORDER if aij->nonew is not set or if aij->saved_values is NULL. */ 3788d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3789d71ae5a4SJacob Faibussowitsch { 3790be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3791d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3792be6bf707SBarry Smith 3793be6bf707SBarry Smith PetscFunctionBegin; 379428b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 379528b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3796be6bf707SBarry Smith /* copy values over */ 37979566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3798be6bf707SBarry Smith PetscFunctionReturn(0); 3799be6bf707SBarry Smith } 3800be6bf707SBarry Smith 3801be6bf707SBarry Smith /*@ 3802be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3803be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3804be6bf707SBarry Smith nonlinear portion. 
3805be6bf707SBarry Smith 3806c3339decSBarry Smith Logically Collective 3807be6bf707SBarry Smith 3808be6bf707SBarry Smith Input Parameter: 380911a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3810be6bf707SBarry Smith 381115091d37SBarry Smith Level: advanced 381215091d37SBarry Smith 3813db781477SPatrick Sanan .seealso: `MatStoreValues()` 3814be6bf707SBarry Smith @*/ 3815d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3816d71ae5a4SJacob Faibussowitsch { 3817be6bf707SBarry Smith PetscFunctionBegin; 38180700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 381928b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 382028b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3821cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 3822be6bf707SBarry Smith PetscFunctionReturn(0); 3823be6bf707SBarry Smith } 3824be6bf707SBarry Smith 3825be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 382617ab2063SBarry Smith /*@C 382711a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38280d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38296e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 383051c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38312bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 383217ab2063SBarry Smith 3833d083f849SBarry Smith Collective 3834db81eaa0SLois Curfman McInnes 383517ab2063SBarry Smith Input Parameters: 383611a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 383717ab2063SBarry Smith . 
m - number of rows 383817ab2063SBarry Smith . n - number of columns 383917ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 384051c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38410298fd71SBarry Smith (possibly different for each row) or NULL 384217ab2063SBarry Smith 384317ab2063SBarry Smith Output Parameter: 3844416022c9SBarry Smith . A - the matrix 384517ab2063SBarry Smith 384611a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3847f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 384811a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3849175b88e8SBarry Smith 3850b259b22eSLois Curfman McInnes Notes: 385149a6f317SBarry Smith If nnz is given then nz is ignored 385249a6f317SBarry Smith 385311a5261eSBarry Smith The AIJ format, also called 385411a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38550002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 385644cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 385717ab2063SBarry Smith 385817ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 385911a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38603d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38616da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 386217ab2063SBarry Smith 3863682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38644fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3865682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38666c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38676c7ebb05SLois Curfman McInnes 38686c7ebb05SLois Curfman McInnes Options Database Keys: 3869698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38709db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 387117ab2063SBarry Smith 3872027ccd11SLois Curfman McInnes Level: intermediate 3873027ccd11SLois Curfman McInnes 387460161072SBarry Smith .seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 387517ab2063SBarry Smith @*/ 3876d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3877d71ae5a4SJacob Faibussowitsch { 38783a40ed3dSBarry Smith PetscFunctionBegin; 38799566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38809566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38819566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 3883273d9f13SBarry Smith PetscFunctionReturn(0); 3884273d9f13SBarry Smith } 3885273d9f13SBarry Smith 3886273d9f13SBarry Smith /*@C 3887273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3888273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3889273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3890273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 
3891273d9f13SBarry Smith 3892d083f849SBarry Smith Collective 3893273d9f13SBarry Smith 3894273d9f13SBarry Smith Input Parameters: 38951c4f3114SJed Brown + B - The matrix 3896273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3897273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38980298fd71SBarry Smith (possibly different for each row) or NULL 3899273d9f13SBarry Smith 3900273d9f13SBarry Smith Notes: 390149a6f317SBarry Smith If nnz is given then nz is ignored 390249a6f317SBarry Smith 390311a5261eSBarry Smith The `MATSEQAIJ` format also called 390411a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 3905273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3906273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3907273d9f13SBarry Smith 3908273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 390911a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 3910273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3911273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3912273d9f13SBarry Smith 391311a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3914aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3915aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3916aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3917aa95bbe8SBarry Smith 391811a5261eSBarry Smith Developer Notes: 391911a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3920a96a251dSBarry Smith entries or columns indices 3921a96a251dSBarry Smith 3922273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3923273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3924273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3925273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3926273d9f13SBarry Smith 3927273d9f13SBarry Smith Options Database Keys: 3928698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 392947b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3930273d9f13SBarry Smith 3931273d9f13SBarry Smith Level: intermediate 3932273d9f13SBarry Smith 3933db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3934db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3935273d9f13SBarry Smith @*/ 3936d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3937d71ae5a4SJacob Faibussowitsch { 3938a23d5eceSKris Buschelman PetscFunctionBegin; 39396ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39406ba663aaSJed Brown PetscValidType(B, 1); 3941cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3942a23d5eceSKris Buschelman PetscFunctionReturn(0); 3943a23d5eceSKris Buschelman } 3944a23d5eceSKris Buschelman 3945d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3946d71ae5a4SJacob Faibussowitsch { 3947273d9f13SBarry Smith Mat_SeqAIJ *b; 39482576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 394997f1f81fSBarry Smith PetscInt i; 3950273d9f13SBarry Smith 3951273d9f13SBarry Smith PetscFunctionBegin; 39522576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3953a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3954c461c341SBarry Smith skipallocation = PETSC_TRUE; 3955c461c341SBarry Smith nz = 0; 3956c461c341SBarry Smith } 39579566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39589566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3959899cda47SBarry Smith 3960435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 396108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3962cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3963d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 396408401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 396508401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3966b73539f3SBarry Smith } 3967b73539f3SBarry Smith } 3968b73539f3SBarry Smith 3969273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39702205254eSKarl Rupp 3971273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3972273d9f13SBarry Smith 3973ab93d7beSBarry Smith if (!skipallocation) { 39744dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3975071fcb05SBarry Smith if (!b->ilen) { 3976071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39779566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3978071fcb05SBarry Smith } else { 39799566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39802ee49352SLisandro Dalcin } 39814dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3982273d9f13SBarry Smith if (!nnz) { 3983435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3984c62bd62aSJed Brown else if (nz < 0) nz = 1; 39855d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3986d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3987d0f46423SBarry Smith nz = nz * B->rmap->n; 3988273d9f13SBarry Smith } else { 3989c73702f5SBarry Smith PetscInt64 nz64 = 0; 39909371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39919371c9d4SSatish Balay b->imax[i] = nnz[i]; 39929371c9d4SSatish Balay nz64 += nnz[i]; 39939371c9d4SSatish Balay } 39949566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3995273d9f13SBarry Smith } 3996ab93d7beSBarry Smith 3997273d9f13SBarry Smith /* allocate the matrix space */ 399853dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39999566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4000396832f4SHong Zhang if (B->structure_only) { 40019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4003396832f4SHong Zhang } else { 40049566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4005396832f4SHong Zhang } 4006bfeeae90SHong Zhang b->i[0] = 0; 4007ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4008396832f4SHong Zhang if (B->structure_only) { 4009396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4010396832f4SHong Zhang b->free_a = PETSC_FALSE; 4011396832f4SHong Zhang } else { 4012273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4013e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4014396832f4SHong Zhang } 4015e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4016c461c341SBarry Smith } else { 4017e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4018e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4019c461c341SBarry Smith } 4020273d9f13SBarry Smith 4021846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4022846b4da1SFande Kong /* reserve user-requested sparsity */ 40239566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4024846b4da1SFande Kong } 4025846b4da1SFande Kong 4026273d9f13SBarry Smith b->nz = 0; 4027273d9f13SBarry Smith b->maxnz = nz; 4028273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40291baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4030cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4031cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40325519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40335519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40345519a089SJose E. Roman */ 40355519a089SJose E. Roman B->nonzerostate++; 4036273d9f13SBarry Smith PetscFunctionReturn(0); 4037273d9f13SBarry Smith } 4038273d9f13SBarry Smith 4039d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4040d71ae5a4SJacob Faibussowitsch { 4041846b4da1SFande Kong Mat_SeqAIJ *a; 4042a5bbaf83SFande Kong PetscInt i; 4043846b4da1SFande Kong 4044846b4da1SFande Kong PetscFunctionBegin; 4045846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 404614d0e64fSAlex Lindsay 404714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 404814d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 404914d0e64fSAlex Lindsay 4050846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40512c814fdeSFande Kong /* if no saved info, we error out */ 405228b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40532c814fdeSFande Kong 4054aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40552c814fdeSFande Kong 40569566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4058846b4da1SFande Kong a->i[0] = 0; 4059ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4060846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4061846b4da1SFande Kong a->nz = 0; 4062846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4063846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4064846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4065846b4da1SFande Kong A->assembled = PETSC_FALSE; 4066846b4da1SFande Kong PetscFunctionReturn(0); 4067846b4da1SFande Kong } 4068846b4da1SFande Kong 406958d36128SBarry Smith /*@ 407011a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
sparse sequential matrix in `MATSEQAIJ` format. 4071a1661176SMatthew Knepley 4072a1661176SMatthew Knepley Input Parameters: 4073a1661176SMatthew Knepley + B - the matrix 4074a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4075a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4076a1661176SMatthew Knepley - v - optional values in the matrix 4077a1661176SMatthew Knepley 4078a1661176SMatthew Knepley Level: developer 4079a1661176SMatthew Knepley 40806a9b8d82SBarry Smith Notes: 408111a5261eSBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 408258d36128SBarry Smith 40836a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40846a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40856a9b8d82SBarry Smith 40866a9b8d82SBarry Smith Developer Notes: 40876a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 408811a5261eSBarry Smith then just copies the v values directly with `PetscMemcpy()`. 40896a9b8d82SBarry Smith 409011a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
40916a9b8d82SBarry Smith 4092db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4093a1661176SMatthew Knepley @*/ 4094d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4095d71ae5a4SJacob Faibussowitsch { 4096a1661176SMatthew Knepley PetscFunctionBegin; 40970700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 40986ba663aaSJed Brown PetscValidType(B, 1); 4099cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4100a1661176SMatthew Knepley PetscFunctionReturn(0); 4101a1661176SMatthew Knepley } 4102a1661176SMatthew Knepley 4103d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4104d71ae5a4SJacob Faibussowitsch { 4105a1661176SMatthew Knepley PetscInt i; 4106a1661176SMatthew Knepley PetscInt m, n; 4107a1661176SMatthew Knepley PetscInt nz; 41086a9b8d82SBarry Smith PetscInt *nnz; 4109a1661176SMatthew Knepley 4110a1661176SMatthew Knepley PetscFunctionBegin; 4111aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4112779a8d59SSatish Balay 41139566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41149566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4115779a8d59SSatish Balay 41169566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41179566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4118a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4119b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 412008401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4121a1661176SMatthew Knepley nnz[i] = nz; 4122a1661176SMatthew Knepley } 41239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41249566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4125a1661176SMatthew Knepley 412648a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4127a1661176SMatthew Knepley 41289566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41299566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4130a1661176SMatthew Knepley 41319566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4132a1661176SMatthew Knepley PetscFunctionReturn(0); 4133a1661176SMatthew Knepley } 4134a1661176SMatthew Knepley 4135ad7e164aSPierre Jolivet /*@ 4136ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4137ad7e164aSPierre Jolivet 4138ad7e164aSPierre Jolivet Input Parameters: 4139ad7e164aSPierre Jolivet + A - left-hand side matrix 4140ad7e164aSPierre Jolivet . B - right-hand side matrix 414111a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4142ad7e164aSPierre Jolivet 4143ad7e164aSPierre Jolivet Output Parameter: 4144ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4145ad7e164aSPierre Jolivet 4146ad7e164aSPierre Jolivet Level: intermediate 4147ad7e164aSPierre Jolivet 414811a5261eSBarry Smith Note: 414911a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4150ad7e164aSPierre Jolivet 4151db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4152ad7e164aSPierre Jolivet @*/ 4153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4154d71ae5a4SJacob Faibussowitsch { 4155ad7e164aSPierre Jolivet PetscFunctionBegin; 4156ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4157ad7e164aSPierre Jolivet PetscValidType(A, 1); 4158ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4159ad7e164aSPierre Jolivet PetscValidType(B, 2); 4160ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4161ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4162ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4163ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4164ad7e164aSPierre Jolivet } 4165cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4166ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4167ad7e164aSPierre Jolivet } 4168ad7e164aSPierre Jolivet 4169d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4170d71ae5a4SJacob Faibussowitsch { 4171ad7e164aSPierre Jolivet Mat newmat; 4172ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4173ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4174ad7e164aSPierre Jolivet PetscScalar *v; 4175fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4176ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4177ad7e164aSPierre Jolivet PetscBool flg; 4178ad7e164aSPierre Jolivet 4179ad7e164aSPierre Jolivet PetscFunctionBegin; 418028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418128b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 418228b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 418328b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 418528b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4186aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4187ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41889566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41899566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41909566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41919566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4192ad7e164aSPierre Jolivet i[0] = 0; 4193ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4194ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4195ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4196ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4197ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4198ad7e164aSPierre Jolivet } 4199ad7e164aSPierre Jolivet } 4200ad7e164aSPierre Jolivet } 42019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4202ad7e164aSPierre Jolivet *C = newmat; 42039566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4204ad7e164aSPierre Jolivet nnz = 0; 4205ad7e164aSPierre Jolivet } 42069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 42079566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4209ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4210ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4211ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4212ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4213ad7e164aSPierre Jolivet } 4214ad7e164aSPierre Jolivet } 4215ad7e164aSPierre Jolivet } 42169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4219ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4220ad7e164aSPierre Jolivet } 4221ad7e164aSPierre Jolivet 4222c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4223af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4224170fe5c8SBarry Smith 4225170fe5c8SBarry Smith /* 4226170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4227170fe5c8SBarry Smith 4228170fe5c8SBarry Smith n p p 42292da392ccSBarry Smith [ ] [ ] [ ] 42302da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42312da392ccSBarry Smith [ ] [ ] [ ] 4232170fe5c8SBarry Smith 4233170fe5c8SBarry Smith */ 4234d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4235d71ae5a4SJacob Faibussowitsch { 4236170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4237170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4238170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 423986214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4240170fe5c8SBarry Smith const PetscInt *ii, *idx; 4241170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4242170fe5c8SBarry Smith PetscScalar *c, *c_q; 424386214ceeSStefano Zampini PetscInt clda = sub_c->lda; 424486214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4245170fe5c8SBarry Smith 4246170fe5c8SBarry Smith PetscFunctionBegin; 4247d0f46423SBarry Smith m = A->rmap->n; 4248d0f46423SBarry Smith n = A->cmap->n; 4249d0f46423SBarry Smith p = B->cmap->n; 4250170fe5c8SBarry Smith a = sub_a->v; 4251170fe5c8SBarry Smith b = sub_b->a; 4252170fe5c8SBarry Smith c = sub_c->v; 425386214ceeSStefano Zampini if (clda == m) { 42549566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 425586214ceeSStefano Zampini } else { 425686214ceeSStefano Zampini for (j = 0; j < p; j++) 42579371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 425886214ceeSStefano Zampini } 4259170fe5c8SBarry Smith ii = sub_b->i; 4260170fe5c8SBarry Smith idx = sub_b->j; 4261170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4262170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4263170fe5c8SBarry Smith while (q-- > 0) { 426486214ceeSStefano Zampini c_q = c + clda * (*idx); 426586214ceeSStefano Zampini a_q = a + alda * i; 4266854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4267170fe5c8SBarry Smith idx++; 4268170fe5c8SBarry Smith b++; 4269170fe5c8SBarry Smith } 4270170fe5c8SBarry Smith } 4271170fe5c8SBarry Smith PetscFunctionReturn(0); 4272170fe5c8SBarry Smith } 4273170fe5c8SBarry Smith 4274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4275d71ae5a4SJacob Faibussowitsch { 4276d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 427786214ceeSStefano Zampini PetscBool cisdense; 4278170fe5c8SBarry Smith 4279170fe5c8SBarry Smith PetscFunctionBegin; 428008401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42819566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42829566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 42839566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 428448a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42859566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4286d73949e8SHong Zhang 42874222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4288170fe5c8SBarry Smith PetscFunctionReturn(0); 4289170fe5c8SBarry Smith } 4290170fe5c8SBarry Smith 4291170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42920bad9183SKris Buschelman /*MC 4293fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42940bad9183SKris Buschelman based on compressed sparse row format. 42950bad9183SKris Buschelman 42960bad9183SKris Buschelman Options Database Keys: 42970bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 42980bad9183SKris Buschelman 42990bad9183SKris Buschelman Level: beginner 43000bad9183SKris Buschelman 43010cd7f59aSBarry Smith Notes: 430211a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 43030cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43040cd7f59aSBarry Smith in the matrix 43050cd7f59aSBarry Smith 430611a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no 430711a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43080cd7f59aSBarry Smith 430911a5261eSBarry Smith Developer Note: 43100cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 43110cd7f59aSBarry Smith 4312db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43130bad9183SKris Buschelman M*/ 43140bad9183SKris Buschelman 4315ccd284c7SBarry Smith /*MC 4316ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4317ccd284c7SBarry Smith 431811a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 431911a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 432011a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4321ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4322ccd284c7SBarry Smith the above preallocation routines for simplicity. 4323ccd284c7SBarry Smith 4324ccd284c7SBarry Smith Options Database Keys: 432511a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4326ccd284c7SBarry Smith 432711a5261eSBarry Smith Note: 432811a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4329ccd284c7SBarry Smith enough exist. 
4330ccd284c7SBarry Smith 4331ccd284c7SBarry Smith Level: beginner 4332ccd284c7SBarry Smith 4333db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4334ccd284c7SBarry Smith M*/ 4335ccd284c7SBarry Smith 4336ccd284c7SBarry Smith /*MC 4337ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4338ccd284c7SBarry Smith 433911a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 434011a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 434111a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4342ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4343ccd284c7SBarry Smith the above preallocation routines for simplicity. 4344ccd284c7SBarry Smith 4345ccd284c7SBarry Smith Options Database Keys: 434611a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4347ccd284c7SBarry Smith 4348ccd284c7SBarry Smith Level: beginner 4349ccd284c7SBarry Smith 4350c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4351ccd284c7SBarry Smith M*/ 4352ccd284c7SBarry Smith 43537906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43547906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43557906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43567906f579SHong Zhang #endif 4357d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4358d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4359d24d4204SJose E. 
Roman #endif 43607906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43617906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43627906f579SHong Zhang #endif 43637906f579SHong Zhang 4364d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4365c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43664222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43677906f579SHong Zhang 43688c778c55SBarry Smith /*@C 436911a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43708c778c55SBarry Smith 43718c778c55SBarry Smith Not Collective 43728c778c55SBarry Smith 43738c778c55SBarry Smith Input Parameter: 437411a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43758c778c55SBarry Smith 43768c778c55SBarry Smith Output Parameter: 43778c778c55SBarry Smith . 
array - pointer to the data 43788c778c55SBarry Smith 43798c778c55SBarry Smith Level: intermediate 43808c778c55SBarry Smith 4381db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43828c778c55SBarry Smith @*/ 4383d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4384d71ae5a4SJacob Faibussowitsch { 4385d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43868c778c55SBarry Smith 43878c778c55SBarry Smith PetscFunctionBegin; 4388d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43899566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4390d67d9f35SJunchao Zhang } else { 4391d67d9f35SJunchao Zhang *array = aij->a; 4392d67d9f35SJunchao Zhang } 4393d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4394d67d9f35SJunchao Zhang } 4395d67d9f35SJunchao Zhang 4396d67d9f35SJunchao Zhang /*@C 439711a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4398d67d9f35SJunchao Zhang 4399d67d9f35SJunchao Zhang Not Collective 4400d67d9f35SJunchao Zhang 4401d67d9f35SJunchao Zhang Input Parameters: 440211a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4403d67d9f35SJunchao Zhang - array - pointer to the data 4404d67d9f35SJunchao Zhang 4405d67d9f35SJunchao Zhang Level: intermediate 4406d67d9f35SJunchao Zhang 4407db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4408d67d9f35SJunchao Zhang @*/ 4409d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4410d71ae5a4SJacob Faibussowitsch { 4411d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4412d67d9f35SJunchao Zhang 4413d67d9f35SJunchao Zhang PetscFunctionBegin; 4414d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44159566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4416d67d9f35SJunchao Zhang } else { 4417d67d9f35SJunchao 
Zhang *array = NULL; 4418d67d9f35SJunchao Zhang } 44199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44209566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44218c778c55SBarry Smith PetscFunctionReturn(0); 44228c778c55SBarry Smith } 44238c778c55SBarry Smith 442421e72a00SBarry Smith /*@C 442511a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44268f1ea47aSStefano Zampini 44278f1ea47aSStefano Zampini Not Collective 44288f1ea47aSStefano Zampini 44298f1ea47aSStefano Zampini Input Parameter: 443011a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44318f1ea47aSStefano Zampini 44328f1ea47aSStefano Zampini Output Parameter: 44338f1ea47aSStefano Zampini . array - pointer to the data 44348f1ea47aSStefano Zampini 44358f1ea47aSStefano Zampini Level: intermediate 44368f1ea47aSStefano Zampini 4437db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44388f1ea47aSStefano Zampini @*/ 4439d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4440d71ae5a4SJacob Faibussowitsch { 4441d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44428f1ea47aSStefano Zampini 44438f1ea47aSStefano Zampini PetscFunctionBegin; 4444d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44459566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4446d67d9f35SJunchao Zhang } else { 4447d67d9f35SJunchao Zhang *array = aij->a; 4448d67d9f35SJunchao Zhang } 44498f1ea47aSStefano Zampini PetscFunctionReturn(0); 44508f1ea47aSStefano Zampini } 44518f1ea47aSStefano Zampini 44528f1ea47aSStefano Zampini /*@C 445311a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44548f1ea47aSStefano Zampini 44558f1ea47aSStefano Zampini Not Collective 44568f1ea47aSStefano Zampini 44578f1ea47aSStefano Zampini Input 
Parameter: 445811a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44598f1ea47aSStefano Zampini 44608f1ea47aSStefano Zampini Output Parameter: 44618f1ea47aSStefano Zampini . array - pointer to the data 44628f1ea47aSStefano Zampini 44638f1ea47aSStefano Zampini Level: intermediate 44648f1ea47aSStefano Zampini 4465db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44668f1ea47aSStefano Zampini @*/ 4467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4468d71ae5a4SJacob Faibussowitsch { 4469d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44708f1ea47aSStefano Zampini 44718f1ea47aSStefano Zampini PetscFunctionBegin; 4472d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44739566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4474d67d9f35SJunchao Zhang } else { 4475d67d9f35SJunchao Zhang *array = NULL; 4476d67d9f35SJunchao Zhang } 4477d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4478d67d9f35SJunchao Zhang } 4479d67d9f35SJunchao Zhang 4480d67d9f35SJunchao Zhang /*@C 448111a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4482d67d9f35SJunchao Zhang 4483d67d9f35SJunchao Zhang Not Collective 4484d67d9f35SJunchao Zhang 4485d67d9f35SJunchao Zhang Input Parameter: 448611a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4487d67d9f35SJunchao Zhang 4488d67d9f35SJunchao Zhang Output Parameter: 4489d67d9f35SJunchao Zhang . 
array - pointer to the data 4490d67d9f35SJunchao Zhang 4491d67d9f35SJunchao Zhang Level: intermediate 4492d67d9f35SJunchao Zhang 4493db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayWrite()` 4494d67d9f35SJunchao Zhang @*/ 4495d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4496d71ae5a4SJacob Faibussowitsch { 4497d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4498d67d9f35SJunchao Zhang 4499d67d9f35SJunchao Zhang PetscFunctionBegin; 4500d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45019566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4502d67d9f35SJunchao Zhang } else { 4503d67d9f35SJunchao Zhang *array = aij->a; 4504d67d9f35SJunchao Zhang } 45059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45069566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4507d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4508d67d9f35SJunchao Zhang } 4509d67d9f35SJunchao Zhang 4510d67d9f35SJunchao Zhang /*@C 4511d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the write-only access array obtained from `MatSeqAIJGetArrayWrite()` 4512d67d9f35SJunchao Zhang 4513d67d9f35SJunchao Zhang Not Collective 4514d67d9f35SJunchao Zhang 4515d67d9f35SJunchao Zhang Input Parameter: 4516d67d9f35SJunchao Zhang . mat - a `MATSEQAIJ` matrix 4517d67d9f35SJunchao Zhang 4518d67d9f35SJunchao Zhang Output Parameter: 4519d67d9f35SJunchao Zhang . 
array - pointer to the data 4520d67d9f35SJunchao Zhang 4521d67d9f35SJunchao Zhang Level: intermediate 4522d67d9f35SJunchao Zhang 4523db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayWrite()` 4524d67d9f35SJunchao Zhang @*/ 4525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4526d71ae5a4SJacob Faibussowitsch { 4527d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4528d67d9f35SJunchao Zhang 4529d67d9f35SJunchao Zhang PetscFunctionBegin; 4530d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45319566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4532d67d9f35SJunchao Zhang } else { 4533d67d9f35SJunchao Zhang *array = NULL; 4534d67d9f35SJunchao Zhang } 45358f1ea47aSStefano Zampini PetscFunctionReturn(0); 45368f1ea47aSStefano Zampini } 45378f1ea47aSStefano Zampini 45388f1ea47aSStefano Zampini /*@C 453911a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45407ee59b9bSJunchao Zhang 45417ee59b9bSJunchao Zhang Not Collective 45427ee59b9bSJunchao Zhang 45437ee59b9bSJunchao Zhang Input Parameter: 454411a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45457ee59b9bSJunchao Zhang 45467ee59b9bSJunchao Zhang Output Parameters: 45477ee59b9bSJunchao Zhang + i - row map array of the matrix 45487ee59b9bSJunchao Zhang . j - column index array of the matrix 45497ee59b9bSJunchao Zhang . a - data array of the matrix 45507ee59b9bSJunchao Zhang - mtype - memory type of the arrays 45517ee59b9bSJunchao Zhang 45527ee59b9bSJunchao Zhang Notes: 45537ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45547ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45557ee59b9bSJunchao Zhang 45567ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45577ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45587ee59b9bSJunchao Zhang 45597ee59b9bSJunchao Zhang Level: Developer 45607ee59b9bSJunchao Zhang 4561db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45627ee59b9bSJunchao Zhang @*/ 4563d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4564d71ae5a4SJacob Faibussowitsch { 45657ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45667ee59b9bSJunchao Zhang 45677ee59b9bSJunchao Zhang PetscFunctionBegin; 45687ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45697ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45707ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45717ee59b9bSJunchao Zhang } else { 45727ee59b9bSJunchao Zhang if (i) *i = aij->i; 45737ee59b9bSJunchao Zhang if (j) *j = aij->j; 45747ee59b9bSJunchao Zhang if (a) *a = aij->a; 45757ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45767ee59b9bSJunchao Zhang } 45777ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45787ee59b9bSJunchao Zhang } 45797ee59b9bSJunchao Zhang 45807ee59b9bSJunchao Zhang /*@C 458121e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 458221e72a00SBarry Smith 458321e72a00SBarry Smith Not Collective 458421e72a00SBarry Smith 458521e72a00SBarry Smith Input Parameter: 458611a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 458721e72a00SBarry Smith 458821e72a00SBarry Smith Output Parameter: 458921e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 459021e72a00SBarry Smith 459121e72a00SBarry Smith Level: intermediate 459221e72a00SBarry Smith 4593db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 459421e72a00SBarry Smith @*/ 4595d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4596d71ae5a4SJacob Faibussowitsch { 459721e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 459821e72a00SBarry Smith 459921e72a00SBarry Smith PetscFunctionBegin; 460021e72a00SBarry Smith *nz = aij->rmax; 460121e72a00SBarry Smith PetscFunctionReturn(0); 460221e72a00SBarry Smith } 460321e72a00SBarry Smith 4604d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4605d71ae5a4SJacob Faibussowitsch { 4606394ed5ebSJunchao Zhang MPI_Comm comm; 4607394ed5ebSJunchao Zhang PetscInt *i, *j; 4608394ed5ebSJunchao Zhang PetscInt M, N, row; 4609394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4610394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4611394ed5ebSJunchao Zhang PetscInt *Aj; 4612394ed5ebSJunchao Zhang PetscScalar *Aa; 4613cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4614cbc6b225SStefano Zampini MatType rtype; 4615394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4616394ed5ebSJunchao Zhang 4617394ed5ebSJunchao Zhang PetscFunctionBegin; 46189566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46199566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46209566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4621e8729f6fSJunchao Zhang i = coo_i; 4622e8729f6fSJunchao Zhang j = coo_j; 46239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4624394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4625394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4626394ed5ebSJunchao Zhang perm[k] = k; 4627394ed5ebSJunchao Zhang } 4628394ed5ebSJunchao Zhang 4629394ed5ebSJunchao Zhang /* Sort by row */ 46309566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46319371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46329371c9d4SSatish Balay if (i[k] >= 0) break; 46339371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4634394ed5ebSJunchao Zhang nneg = k; 46359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4636394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4637394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4638394ed5ebSJunchao Zhang 46399566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4641394ed5ebSJunchao Zhang 4642394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4643394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4644394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4645394ed5ebSJunchao Zhang while (k < coo_n) { 4646394ed5ebSJunchao Zhang row = i[k]; 4647394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4648394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4649394ed5ebSJunchao Zhang end = k; 46509566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4651394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4652394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4653394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4654394ed5ebSJunchao Zhang Ai[row] = 1; 4655394ed5ebSJunchao Zhang nnz++; 4656394ed5ebSJunchao Zhang 4657394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4658394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4659394ed5ebSJunchao Zhang q++; 4660394ed5ebSJunchao Zhang jmap[q] = 1; 4661394ed5ebSJunchao Zhang Aj[q] = j[p]; 4662394ed5ebSJunchao Zhang Ai[row]++; 4663394ed5ebSJunchao Zhang nnz++; 4664394ed5ebSJunchao Zhang } else { 4665394ed5ebSJunchao Zhang jmap[q]++; 4666394ed5ebSJunchao Zhang } 4667394ed5ebSJunchao Zhang } 4668394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4669394ed5ebSJunchao Zhang } 4670394ed5ebSJunchao Zhang 4671394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4672394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4673394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4674394ed5ebSJunchao Zhang jmap[0] = 0; 4675394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4676394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4677394ed5ebSJunchao Zhang PetscCount *jmap_new; 4678394ed5ebSJunchao Zhang PetscInt *Aj_new; 4679394ed5ebSJunchao Zhang 46809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46819566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46829566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4683394ed5ebSJunchao Zhang jmap = jmap_new; 4684394ed5ebSJunchao Zhang 46859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46869566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 46879566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4688394ed5ebSJunchao Zhang Aj = Aj_new; 4689394ed5ebSJunchao Zhang } 4690394ed5ebSJunchao Zhang 
4691394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4692394ed5ebSJunchao Zhang PetscCount *perm_new; 4693cbc6b225SStefano Zampini 46949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 46959566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 46969566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4697394ed5ebSJunchao Zhang perm = perm_new; 4698394ed5ebSJunchao Zhang } 4699394ed5ebSJunchao Zhang 47009566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 47029566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4703394ed5ebSJunchao Zhang 4704394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4705394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4706394ed5ebSJunchao Zhang /* Record COO fields */ 4707394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4708394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4709394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4710394ed5ebSJunchao Zhang seqaij->perm = perm; 4711394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4712394ed5ebSJunchao Zhang } 4713394ed5ebSJunchao Zhang 4714d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4715d71ae5a4SJacob Faibussowitsch { 4716394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4717394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4718394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4719394ed5ebSJunchao Zhang PetscScalar *Aa; 
4720394ed5ebSJunchao Zhang 4721394ed5ebSJunchao Zhang PetscFunctionBegin; 47229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4723394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4724b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4725b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4726b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4727394ed5ebSJunchao Zhang } 47289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4729394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4730394ed5ebSJunchao Zhang } 4731394ed5ebSJunchao Zhang 473234b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47335063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 473402fe1965SBarry Smith #endif 47353d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47365063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47373d0639e7SStefano Zampini #endif 473802fe1965SBarry Smith 4739d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4740d71ae5a4SJacob Faibussowitsch { 4741273d9f13SBarry Smith Mat_SeqAIJ *b; 474238baddfdSBarry Smith PetscMPIInt size; 4743273d9f13SBarry Smith 4744273d9f13SBarry Smith PetscFunctionBegin; 47459566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 474608401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4747273d9f13SBarry Smith 47484dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47492205254eSKarl Rupp 4750b0a32e0cSBarry Smith B->data = (void *)b; 47512205254eSKarl Rupp 47529566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4753071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47542205254eSKarl Rupp 
4755f4259b30SLisandro Dalcin b->row = NULL; 4756f4259b30SLisandro Dalcin b->col = NULL; 4757f4259b30SLisandro Dalcin b->icol = NULL; 4758b810aeb4SBarry Smith b->reallocs = 0; 475936db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4760f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4761416022c9SBarry Smith b->nonew = 0; 4762f4259b30SLisandro Dalcin b->diag = NULL; 4763f4259b30SLisandro Dalcin b->solve_work = NULL; 4764f4259b30SLisandro Dalcin B->spptr = NULL; 4765f4259b30SLisandro Dalcin b->saved_values = NULL; 4766f4259b30SLisandro Dalcin b->idiag = NULL; 4767f4259b30SLisandro Dalcin b->mdiag = NULL; 4768f4259b30SLisandro Dalcin b->ssor_work = NULL; 476971f1c65dSBarry Smith b->omega = 1.0; 477071f1c65dSBarry Smith b->fshift = 0.0; 477171f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4772bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4773a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 477417ab2063SBarry Smith 47759566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4776d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 47779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 47789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4779b3866ffcSBarry Smith #endif 47809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 47819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 47829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 47839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 
47849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 47859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 47869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 47879779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 47889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4789191b95cbSRichard Tran Mills #endif 479034b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 47929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 479402fe1965SBarry Smith #endif 47953d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 47973d0639e7SStefano Zampini #endif 47989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4799af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4801af8000cdSHong Zhang #endif 4802d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 48039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4804d24d4204SJose E. Roman #endif 480563c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 480863c07aadSStefano Zampini #endif 48099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 48139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 48149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 48169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48189566063dSJacob 
Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48249566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48259566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 48269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48273a40ed3dSBarry Smith PetscFunctionReturn(0); 482817ab2063SBarry Smith } 482917ab2063SBarry Smith 4830b24902e0SBarry Smith /* 48313893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4832b24902e0SBarry Smith */ 4833d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4834d71ae5a4SJacob Faibussowitsch { 48352a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4836071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 483717ab2063SBarry Smith 48383a40ed3dSBarry Smith PetscFunctionBegin; 4839aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4840273d9f13SBarry Smith 4841d5f3da31SBarry Smith C->factortype = A->factortype; 4842f4259b30SLisandro Dalcin c->row = NULL; 4843f4259b30SLisandro Dalcin c->col = NULL; 4844f4259b30SLisandro Dalcin c->icol = NULL; 48456ad4291fSHong Zhang c->reallocs = 0; 484617ab2063SBarry Smith 484769272f91SPierre Jolivet C->assembled = A->assembled; 484869272f91SPierre Jolivet C->preallocated = A->preallocated; 484917ab2063SBarry Smith 485069272f91SPierre Jolivet if (A->preallocated) { 48519566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48529566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4853eec197d1SBarry Smith 48549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48559566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48579566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 485817ab2063SBarry Smith 485917ab2063SBarry Smith /* allocate the matrix space */ 4860f77e22a1SHong Zhang if (mallocmatspace) { 48619566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48622205254eSKarl Rupp 4863f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48642205254eSKarl Rupp 48659566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 486617ab2063SBarry Smith if (m > 0) { 48679566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4868be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48692e5835c6SStefano Zampini const PetscScalar *aa; 48702e5835c6SStefano Zampini 48719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
4874be6bf707SBarry Smith } else { 48759566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 487617ab2063SBarry Smith } 487708480c60SBarry Smith } 4878f77e22a1SHong Zhang } 487917ab2063SBarry Smith 48806ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4881416022c9SBarry Smith c->roworiented = a->roworiented; 4882416022c9SBarry Smith c->nonew = a->nonew; 4883416022c9SBarry Smith if (a->diag) { 48849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 48859566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4886071fcb05SBarry Smith } else c->diag = NULL; 48872205254eSKarl Rupp 4888f4259b30SLisandro Dalcin c->solve_work = NULL; 4889f4259b30SLisandro Dalcin c->saved_values = NULL; 4890f4259b30SLisandro Dalcin c->idiag = NULL; 4891f4259b30SLisandro Dalcin c->ssor_work = NULL; 4892a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4893e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4894e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 48956ad4291fSHong Zhang 4896893ad86cSHong Zhang c->rmax = a->rmax; 4897416022c9SBarry Smith c->nz = a->nz; 48988ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4899754ec7b1SSatish Balay 49006ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49016ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4902cd6b891eSBarry Smith if (a->compressedrow.use) { 49036ad4291fSHong Zhang i = a->compressedrow.nrows; 49049566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49069566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 490727ea64f8SHong Zhang } else { 490827ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49090298fd71SBarry Smith c->compressedrow.i = 
NULL; 49100298fd71SBarry Smith c->compressedrow.rindex = NULL; 49116ad4291fSHong Zhang } 4912ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4913e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49144846f1f5SKris Buschelman 49159566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 491669272f91SPierre Jolivet } 49179566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49183a40ed3dSBarry Smith PetscFunctionReturn(0); 491917ab2063SBarry Smith } 492017ab2063SBarry Smith 4921d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4922d71ae5a4SJacob Faibussowitsch { 4923b24902e0SBarry Smith PetscFunctionBegin; 49249566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49259566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 492648a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49279566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49289566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4929b24902e0SBarry Smith PetscFunctionReturn(0); 4930b24902e0SBarry Smith } 4931b24902e0SBarry Smith 4932d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4933d71ae5a4SJacob Faibussowitsch { 493452f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 493552f91c60SVaclav Hapla 493652f91c60SVaclav Hapla PetscFunctionBegin; 493752f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 493852f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4939c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49409566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 
49419566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49429566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 494352f91c60SVaclav Hapla if (isbinary) { 49449566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 494552f91c60SVaclav Hapla } else if (ishdf5) { 494652f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49479566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 494852f91c60SVaclav Hapla #else 494952f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 495052f91c60SVaclav Hapla #endif 495152f91c60SVaclav Hapla } else { 495298921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 495352f91c60SVaclav Hapla } 495452f91c60SVaclav Hapla PetscFunctionReturn(0); 495552f91c60SVaclav Hapla } 495652f91c60SVaclav Hapla 4957d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4958d71ae5a4SJacob Faibussowitsch { 49593ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49603ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4961fbdbba38SShri Abhyankar 4962fbdbba38SShri Abhyankar PetscFunctionBegin; 49639566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4964bbead8a2SBarry Smith 49653ea6fe3dSLisandro Dalcin /* read in matrix header */ 49669566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 496708401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49689371c9d4SSatish Balay M = header[1]; 
49699371c9d4SSatish Balay N = header[2]; 49709371c9d4SSatish Balay nz = header[3]; 497108401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 497208401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 497308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4974fbdbba38SShri Abhyankar 49753ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49769566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49773ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49783ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49793ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49803ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49813ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49829566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49839566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49843ea6fe3dSLisandro Dalcin 49853ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49869566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4987aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49883ea6fe3dSLisandro Dalcin 4989fbdbba38SShri Abhyankar /* read in row lengths */ 49909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 49919566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 
49923ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 49939371c9d4SSatish Balay sum = 0; 49949371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 499508401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 49963ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 49979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 49989566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4999aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50003ea6fe3dSLisandro Dalcin /* store row lengths */ 50019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50029566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5003fbdbba38SShri Abhyankar 50043ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50059371c9d4SSatish Balay a->i[0] = 0; 50069371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50073ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50089566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50093ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50109566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5011fbdbba38SShri Abhyankar 50129566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50139566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 5014fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5015fbdbba38SShri Abhyankar } 5016fbdbba38SShri Abhyankar 5017d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5018d71ae5a4SJacob Faibussowitsch { 50197264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5020fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5021eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5022eeffb40dSHong Zhang PetscInt k; 5023eeffb40dSHong Zhang #endif 50247264ac53SSatish Balay 50253a40ed3dSBarry Smith PetscFunctionBegin; 5026bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5027d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5028ca44d042SBarry Smith *flg = PETSC_FALSE; 5029ca44d042SBarry Smith PetscFunctionReturn(0); 5030bcd2baecSBarry Smith } 50317264ac53SSatish Balay 50327264ac53SSatish Balay /* if the a->i are the same */ 50339566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5034abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50357264ac53SSatish Balay 50367264ac53SSatish Balay /* if a->j are the same */ 50379566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5038abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5039bcd2baecSBarry Smith 50409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5042bcd2baecSBarry Smith /* if a->a are the same */ 5043eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5044eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5045fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5046eeffb40dSHong Zhang *flg = PETSC_FALSE; 50473a40ed3dSBarry Smith PetscFunctionReturn(0); 5048eeffb40dSHong Zhang } 5049eeffb40dSHong Zhang } 5050eeffb40dSHong Zhang #else 50519566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5052eeffb40dSHong Zhang #endif 50539566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5055eeffb40dSHong Zhang PetscFunctionReturn(0); 50567264ac53SSatish Balay } 505736db0b34SBarry Smith 505805869f15SSatish Balay /*@ 505911a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 506036db0b34SBarry Smith provided by the user. 506136db0b34SBarry Smith 5062d083f849SBarry Smith Collective 506336db0b34SBarry Smith 506436db0b34SBarry Smith Input Parameters: 506536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 506636db0b34SBarry Smith . m - number of rows 506736db0b34SBarry Smith . n - number of columns 5068483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 506936db0b34SBarry Smith . j - column indices 507036db0b34SBarry Smith - a - matrix values 507136db0b34SBarry Smith 507236db0b34SBarry Smith Output Parameter: 507336db0b34SBarry Smith . mat - the matrix 507436db0b34SBarry Smith 507536db0b34SBarry Smith Level: intermediate 507636db0b34SBarry Smith 507736db0b34SBarry Smith Notes: 50780551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5079292fb18eSBarry Smith once the matrix is destroyed and not before 508036db0b34SBarry Smith 508136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 508236db0b34SBarry Smith 5083bfeeae90SHong Zhang The i and j indices are 0 based 508436db0b34SBarry Smith 5085a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5086a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50878eef79e4SBarry Smith as shown 5088a4552177SSatish Balay 50898eef79e4SBarry Smith $ 1 0 0 50908eef79e4SBarry Smith $ 2 0 3 50918eef79e4SBarry Smith $ 4 5 6 50928eef79e4SBarry Smith $ 50938eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 50948eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 50958eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5096a4552177SSatish Balay 5097db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 509836db0b34SBarry Smith @*/ 5099d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5100d71ae5a4SJacob Faibussowitsch { 5101cbcfb4deSHong Zhang PetscInt ii; 510236db0b34SBarry Smith Mat_SeqAIJ *aij; 5103cbcfb4deSHong Zhang PetscInt jj; 510436db0b34SBarry Smith 510536db0b34SBarry Smith PetscFunctionBegin; 5106aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51079566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51089566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51099566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51109566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5112ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5115ab93d7beSBarry Smith 511636db0b34SBarry Smith aij->i = i; 511736db0b34SBarry Smith aij->j = j; 511836db0b34SBarry Smith aij->a = a; 511936db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
512036db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5121e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5122e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 512336db0b34SBarry Smith 5124cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 512536db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 512676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5127aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51289985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 512908401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 513008401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51319985e31cSBarry Smith } 513236db0b34SBarry Smith } 513376bd3646SJed Brown } 513476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 513536db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 513608401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5137aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 513836db0b34SBarry Smith } 513976bd3646SJed Brown } 514036db0b34SBarry Smith 51419566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51429566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 514336db0b34SBarry Smith PetscFunctionReturn(0); 514436db0b34SBarry Smith } 5145cbc6b225SStefano Zampini 5146f62e3866SBarry Smith /*@ 514711a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51488a0b0e6bSVictor Minden provided by the user. 51498a0b0e6bSVictor Minden 5150d083f849SBarry Smith Collective 51518a0b0e6bSVictor Minden 51528a0b0e6bSVictor Minden Input Parameters: 51538a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51548a0b0e6bSVictor Minden . m - number of rows 51558a0b0e6bSVictor Minden . n - number of columns 51568a0b0e6bSVictor Minden . i - row indices 51578a0b0e6bSVictor Minden . j - column indices 51581230e6d1SVictor Minden . a - matrix values 51591230e6d1SVictor Minden . nz - number of nonzeros 516011a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51618a0b0e6bSVictor Minden 51628a0b0e6bSVictor Minden Output Parameter: 51638a0b0e6bSVictor Minden . 
mat - the matrix 51648a0b0e6bSVictor Minden 51658a0b0e6bSVictor Minden Level: intermediate 51668a0b0e6bSVictor Minden 5167f62e3866SBarry Smith Example: 5168f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51699e99939fSJunchao Zhang .vb 51708a0b0e6bSVictor Minden 1 0 0 51718a0b0e6bSVictor Minden 2 0 3 51728a0b0e6bSVictor Minden 4 5 6 51738a0b0e6bSVictor Minden 51748a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51758a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51768a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51779e99939fSJunchao Zhang .ve 5178d7547e51SJunchao Zhang Notes: 5179d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5180d7547e51SJunchao Zhang and are particularly useful in iterative applications. 51818a0b0e6bSVictor Minden 5182d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 51838a0b0e6bSVictor Minden @*/ 5184d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5185d71ae5a4SJacob Faibussowitsch { 5186d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 51878a0b0e6bSVictor Minden 51888a0b0e6bSVictor Minden PetscFunctionBegin; 51899566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5190ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 51919566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51929566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51939566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 51951230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 51961230e6d1SVictor Minden if (idx) { 51971230e6d1SVictor Minden row = i[ii] - 1; 51981230e6d1SVictor Minden col = j[ii] - 1; 51991230e6d1SVictor Minden } else { 52001230e6d1SVictor Minden row = i[ii]; 52011230e6d1SVictor Minden col = j[ii]; 52028a0b0e6bSVictor Minden } 52039566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52048a0b0e6bSVictor Minden } 52059566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52069566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52079566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52088a0b0e6bSVictor Minden PetscFunctionReturn(0); 52098a0b0e6bSVictor Minden } 521036db0b34SBarry Smith 5211d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5212d71ae5a4SJacob Faibussowitsch { 5213acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5214acf2f550SJed Brown 5215acf2f550SJed Brown PetscFunctionBegin; 5216acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5217acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52182205254eSKarl Rupp 52199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5220acf2f550SJed Brown PetscFunctionReturn(0); 5221acf2f550SJed Brown } 5222acf2f550SJed Brown 5223d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5224d71ae5a4SJacob Faibussowitsch { 52259c8f2541SHong Zhang PetscFunctionBegin; 52269566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52279c8f2541SHong Zhang PetscFunctionReturn(0); 52289c8f2541SHong Zhang } 52299c8f2541SHong Zhang 523081824310SBarry Smith /* 523153dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
523253dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 523353dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 523453dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 523553dd7562SDmitry Karpeev */ 5236d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5237d71ae5a4SJacob Faibussowitsch { 523853dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 523953dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 524053dd7562SDmitry Karpeev PetscBool seqaij; 524153dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 524253dd7562SDmitry Karpeev PetscScalar v; 524353dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 524453dd7562SDmitry Karpeev 524553dd7562SDmitry Karpeev PetscFunctionBegin; 524653dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 524753dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52489566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 524928b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 525053dd7562SDmitry Karpeev if (rowemb) { 52519566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 525208401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 525353dd7562SDmitry Karpeev } else { 525408401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 525553dd7562SDmitry Karpeev } 525653dd7562SDmitry Karpeev if (colemb) { 52579566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 525808401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 525953dd7562SDmitry Karpeev } else { 526008401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 526153dd7562SDmitry Karpeev } 526253dd7562SDmitry Karpeev 526353dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 526453dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5266ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52689566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 526953dd7562SDmitry Karpeev } 527048a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 527153dd7562SDmitry Karpeev count = 0; 527253dd7562SDmitry Karpeev rowindices = NULL; 
527353dd7562SDmitry Karpeev colindices = NULL; 527448a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 527548a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 527653dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 527753dd7562SDmitry Karpeev PetscInt row; 527853dd7562SDmitry Karpeev row = i; 527953dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 528053dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 528153dd7562SDmitry Karpeev PetscInt col; 528253dd7562SDmitry Karpeev col = Baij->j[count]; 528353dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 528453dd7562SDmitry Karpeev v = Baij->a[count]; 52859566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 528653dd7562SDmitry Karpeev ++count; 528753dd7562SDmitry Karpeev } 528853dd7562SDmitry Karpeev } 528953dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 529053dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 529153dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 529253dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 529353dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 529453dd7562SDmitry Karpeev PetscFunctionReturn(0); 529553dd7562SDmitry Karpeev } 529653dd7562SDmitry Karpeev 52974099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 52984099cc6bSBarry Smith 52994099cc6bSBarry Smith /*@C 530011a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53014099cc6bSBarry Smith 5302c3339decSBarry Smith Collective 53034099cc6bSBarry Smith 53044099cc6bSBarry Smith Input Parameters: 53054099cc6bSBarry Smith + mat - the matrix object 53064099cc6bSBarry Smith - matype - matrix type 53074099cc6bSBarry Smith 53084099cc6bSBarry Smith Options Database Key: 53094099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 53104099cc6bSBarry Smith 53114099cc6bSBarry Smith Level: intermediate 53124099cc6bSBarry Smith 5313db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53144099cc6bSBarry Smith @*/ 5315d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5316d71ae5a4SJacob Faibussowitsch { 53174099cc6bSBarry Smith PetscBool sametype; 53185f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53194099cc6bSBarry Smith 53204099cc6bSBarry Smith PetscFunctionBegin; 53214099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53229566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53234099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53244099cc6bSBarry Smith 53259566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53265f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53279566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53284099cc6bSBarry Smith PetscFunctionReturn(0); 53294099cc6bSBarry Smith } 53304099cc6bSBarry Smith 53314099cc6bSBarry Smith /*@C 533211a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53334099cc6bSBarry Smith 53344099cc6bSBarry Smith Not Collective 53354099cc6bSBarry Smith 53364099cc6bSBarry Smith Input Parameters: 533711a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 53384099cc6bSBarry Smith - function - routine to convert to subtype 53394099cc6bSBarry Smith 53404099cc6bSBarry Smith Notes: 534111a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
53424099cc6bSBarry Smith 53434099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53444099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53454099cc6bSBarry Smith 53464099cc6bSBarry Smith Level: advanced 53474099cc6bSBarry Smith 5348db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53494099cc6bSBarry Smith @*/ 5350d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5351d71ae5a4SJacob Faibussowitsch { 53524099cc6bSBarry Smith PetscFunctionBegin; 53539566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53549566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 53554099cc6bSBarry Smith PetscFunctionReturn(0); 53564099cc6bSBarry Smith } 53574099cc6bSBarry Smith 53584099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53594099cc6bSBarry Smith 53604099cc6bSBarry Smith /*@C 536111a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 53624099cc6bSBarry Smith 53634099cc6bSBarry Smith Not Collective 53644099cc6bSBarry Smith 53654099cc6bSBarry Smith Level: advanced 53664099cc6bSBarry Smith 5367db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53684099cc6bSBarry Smith @*/ 5369d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5370d71ae5a4SJacob Faibussowitsch { 53714099cc6bSBarry Smith PetscFunctionBegin; 53724099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53734099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53744099cc6bSBarry Smith 53759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 53789779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 53799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5380485f9817SRichard Tran Mills #endif 53815063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 53829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 53835063d097SStefano Zampini #endif 53845063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 53859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 53865063d097SStefano Zampini #endif 53874099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 53889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 53894099cc6bSBarry Smith #endif 53904099cc6bSBarry Smith PetscFunctionReturn(0); 53914099cc6bSBarry Smith } 539253dd7562SDmitry Karpeev 539353dd7562SDmitry Karpeev /* 539481824310SBarry Smith Special version for direct calls from Fortran 539581824310SBarry Smith */ 5396af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 539781824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 539881824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 539981824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 540081824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 540181824310SBarry Smith #endif 540281824310SBarry Smith 540381824310SBarry Smith /* Change these macros so can be used in void function */ 540498921bdaSJacob Faibussowitsch 540598921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54069566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54079566063dSJacob Faibussowitsch #undef PetscCall 54089371c9d4SSatish Balay #define PetscCall(...) 
\ 54099371c9d4SSatish Balay do { \ 54105f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 541198921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 541298921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 541398921bdaSJacob Faibussowitsch return; \ 541498921bdaSJacob Faibussowitsch } \ 541598921bdaSJacob Faibussowitsch } while (0) 541698921bdaSJacob Faibussowitsch 541798921bdaSJacob Faibussowitsch #undef SETERRQ 54189371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54199371c9d4SSatish Balay do { \ 542098921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 542198921bdaSJacob Faibussowitsch return; \ 542298921bdaSJacob Faibussowitsch } while (0) 542381824310SBarry Smith 5424d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5425d71ae5a4SJacob Faibussowitsch { 542681824310SBarry Smith Mat A = *AA; 542781824310SBarry Smith PetscInt m = *mm, n = *nn; 542881824310SBarry Smith InsertMode is = *isis; 542981824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 543081824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 543181824310SBarry Smith PetscInt *imax, *ai, *ailen; 543281824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 543354f21887SBarry Smith MatScalar *ap, value, *aa; 5434ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5435ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 543681824310SBarry Smith 543781824310SBarry Smith PetscFunctionBegin; 54384994cf47SJed Brown MatCheckPreallocated(A, 1); 543981824310SBarry Smith imax = a->imax; 544081824310SBarry Smith ai = a->i; 544181824310SBarry Smith 
ailen = a->ilen; 544281824310SBarry Smith aj = a->j; 544381824310SBarry Smith aa = a->a; 544481824310SBarry Smith 544581824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 544681824310SBarry Smith row = im[k]; 544781824310SBarry Smith if (row < 0) continue; 54485f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 54499371c9d4SSatish Balay rp = aj + ai[row]; 54509371c9d4SSatish Balay ap = aa + ai[row]; 54519371c9d4SSatish Balay rmax = imax[row]; 54529371c9d4SSatish Balay nrow = ailen[row]; 545381824310SBarry Smith low = 0; 545481824310SBarry Smith high = nrow; 545581824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 545681824310SBarry Smith if (in[l] < 0) continue; 54575f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 545881824310SBarry Smith col = in[l]; 54592205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 54602205254eSKarl Rupp else value = v[k + l * m]; 54612205254eSKarl Rupp 546281824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 546381824310SBarry Smith 54642205254eSKarl Rupp if (col <= lastcol) low = 0; 54652205254eSKarl Rupp else high = nrow; 546681824310SBarry Smith lastcol = col; 546781824310SBarry Smith while (high - low > 5) { 546881824310SBarry Smith t = (low + high) / 2; 546981824310SBarry Smith if (rp[t] > col) high = t; 547081824310SBarry Smith else low = t; 547181824310SBarry Smith } 547281824310SBarry Smith for (i = low; i < high; i++) { 547381824310SBarry Smith if (rp[i] > col) break; 547481824310SBarry Smith if (rp[i] == col) { 547581824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 547681824310SBarry Smith else ap[i] = value; 547781824310SBarry Smith goto noinsert; 547881824310SBarry Smith } 547981824310SBarry Smith } 548081824310SBarry Smith if (value == 0.0 && 
ignorezeroentries) goto noinsert; 548181824310SBarry Smith if (nonew == 1) goto noinsert; 54825f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5483fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 54849371c9d4SSatish Balay N = nrow++ - 1; 54859371c9d4SSatish Balay a->nz++; 54869371c9d4SSatish Balay high++; 548781824310SBarry Smith /* shift up all the later entries in this row */ 548881824310SBarry Smith for (ii = N; ii >= i; ii--) { 548981824310SBarry Smith rp[ii + 1] = rp[ii]; 549081824310SBarry Smith ap[ii + 1] = ap[ii]; 549181824310SBarry Smith } 549281824310SBarry Smith rp[i] = col; 549381824310SBarry Smith ap[i] = value; 5494e56f5c9eSBarry Smith A->nonzerostate++; 549581824310SBarry Smith noinsert:; 549681824310SBarry Smith low = i + 1; 549781824310SBarry Smith } 549881824310SBarry Smith ailen[row] = nrow; 549981824310SBarry Smith } 550081824310SBarry Smith PetscFunctionReturnVoid(); 550181824310SBarry Smith } 550298921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 550398921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 550498921bdaSJacob Faibussowitsch * original definitions */ 55059566063dSJacob Faibussowitsch #undef PetscCall 550698921bdaSJacob Faibussowitsch #undef SETERRQ 5507