1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 597fff043a9SJunchao Zhang MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 6009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 6369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, 
rowlens, m, PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 11237b083b7cSBarry Smith 112417ab2063SBarry Smith /* reset ilen and imax for each row */ 11257b083b7cSBarry Smith a->nonzerorowcnt = 0; 1126396832f4SHong Zhang if (A->structure_only) { 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1129396832f4SHong Zhang } else { /* !A->structure_only */ 113017ab2063SBarry Smith for (i = 0; i < m; i++) { 113117ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11327b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113317ab2063SBarry Smith } 1134396832f4SHong Zhang } 1135bfeeae90SHong Zhang a->nz = ai[m]; 1136aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, 
PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113717ab2063SBarry Smith 11389566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11419566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11422205254eSKarl Rupp 11438e58a170SBarry Smith A->info.mallocs += a->reallocs; 1144dd5f02e7SSatish Balay a->reallocs = 0; 11456712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114636db0b34SBarry Smith a->rmax = rmax; 11474e220ebcSLois Curfman McInnes 114848a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11503a40ed3dSBarry Smith PetscFunctionReturn(0); 115117ab2063SBarry Smith } 115217ab2063SBarry Smith 1153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1154d71ae5a4SJacob Faibussowitsch { 115599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115699cafbc1SBarry Smith PetscInt i, nz = a->nz; 11572e5835c6SStefano Zampini MatScalar *aa; 115899cafbc1SBarry Smith 115999cafbc1SBarry Smith PetscFunctionBegin; 11609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116199cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116499cafbc1SBarry Smith PetscFunctionReturn(0); 
116599cafbc1SBarry Smith } 116699cafbc1SBarry Smith 1167d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1168d71ae5a4SJacob Faibussowitsch { 116999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117099cafbc1SBarry Smith PetscInt i, nz = a->nz; 11712e5835c6SStefano Zampini MatScalar *aa; 117299cafbc1SBarry Smith 117399cafbc1SBarry Smith PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117899cafbc1SBarry Smith PetscFunctionReturn(0); 117999cafbc1SBarry Smith } 118099cafbc1SBarry Smith 1181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1182d71ae5a4SJacob Faibussowitsch { 1183fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1184fff043a9SJunchao Zhang MatScalar *aa; 11853a40ed3dSBarry Smith 11863a40ed3dSBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11889566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913a40ed3dSBarry Smith PetscFunctionReturn(0); 119217ab2063SBarry Smith } 1193416022c9SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197cbc6b225SStefano Zampini 1198cbc6b225SStefano Zampini PetscFunctionBegin; 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1201cbc6b225SStefano Zampini PetscFunctionReturn(0); 
1202cbc6b225SStefano Zampini } 1203cbc6b225SStefano Zampini 1204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1205d71ae5a4SJacob Faibussowitsch { 1206416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1207d5d45c9bSBarry Smith 12083a40ed3dSBarry Smith PetscFunctionBegin; 1209aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1210c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121117ab2063SBarry Smith #endif 12129566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12139566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12159566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12269566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1228901853e0SKris Buschelman 12296718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12306718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12316718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12326718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12336718818eSStefano Zampini due to different matrix sizes */ 12349566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12356718818eSStefano Zampini 12369566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12382e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12472e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12482e956fe4SStefano Zampini #endif 12494222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12534222ddf1SHong Zhang #endif 12543d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12563d0639e7SStefano Zampini #endif 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1258af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1260af8000cdSHong Zhang #endif 1261d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1263d24d4204SJose E. 
Roman #endif 126463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 126763c07aadSStefano Zampini #endif 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12722e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12832e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12842e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12892e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12903a40ed3dSBarry Smith PetscFunctionReturn(0); 129117ab2063SBarry Smith } 129217ab2063SBarry Smith 1293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1294d71ae5a4SJacob Faibussowitsch { 1295416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 12963a40ed3dSBarry Smith 12973a40ed3dSBarry Smith PetscFunctionBegin; 1298a65d3064SKris Buschelman switch (op) { 1299d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1300d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1301d71ae5a4SJacob Faibussowitsch break; 1302d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1303d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1304d71ae5a4SJacob Faibussowitsch break; 1305d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1306d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1307d71ae5a4SJacob Faibussowitsch break; 1308d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1309d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1310d71ae5a4SJacob Faibussowitsch break; 1311d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1312d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1315d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1318d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1319d71ae5a4SJacob Faibussowitsch break; 13203d472b54SHong Zhang case MAT_SPD: 1321b1646e73SJed Brown case MAT_SYMMETRIC: 1322b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1323b1646e73SJed Brown case MAT_HERMITIAN: 1324b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1325957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1326b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1327b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1328b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13295021d80fSJed Brown break; 13308c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1331a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1332d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1333d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1334d71ae5a4SJacob Faibussowitsch break; 1335d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1336d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1337d71ae5a4SJacob Faibussowitsch break; 1338d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1339d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1340d71ae5a4SJacob Faibussowitsch break; 1341071fcb05SBarry Smith case MAT_SORTED_FULL: 
1342071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1343071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1344071fcb05SBarry Smith break; 1345d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1346d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1347d71ae5a4SJacob Faibussowitsch break; 1348d71ae5a4SJacob Faibussowitsch default: 1349d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1350a65d3064SKris Buschelman } 13513a40ed3dSBarry Smith PetscFunctionReturn(0); 135217ab2063SBarry Smith } 135317ab2063SBarry Smith 1354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1355d71ae5a4SJacob Faibussowitsch { 1356416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1357fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1358c898d852SStefano Zampini PetscScalar *x; 1359c898d852SStefano Zampini const PetscScalar *aa; 136017ab2063SBarry Smith 13613a40ed3dSBarry Smith PetscFunctionBegin; 13629566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1365d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1366d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13679566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13682c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137135e7444dSHong Zhang PetscFunctionReturn(0); 137235e7444dSHong Zhang } 137335e7444dSHong Zhang 13749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137535e7444dSHong Zhang for (i = 0; i < n; i++) { 
1376fdc842d1SBarry Smith x[i] = 0.0; 137735e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 137835e7444dSHong Zhang if (aj[j] == i) { 137935e7444dSHong Zhang x[i] = aa[j]; 138017ab2063SBarry Smith break; 138117ab2063SBarry Smith } 138217ab2063SBarry Smith } 138317ab2063SBarry Smith } 13849566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13863a40ed3dSBarry Smith PetscFunctionReturn(0); 138717ab2063SBarry Smith } 138817ab2063SBarry Smith 1389c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1390d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1391d71ae5a4SJacob Faibussowitsch { 1392416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13935f22a7b3SSebastian Grimberg const MatScalar *aa; 1394d9ca1df4SBarry Smith PetscScalar *y; 1395d9ca1df4SBarry Smith const PetscScalar *x; 1396d0f46423SBarry Smith PetscInt m = A->rmap->n; 13975c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 13985f22a7b3SSebastian Grimberg const MatScalar *v; 1399a77337e4SBarry Smith PetscScalar alpha; 1400d9ca1df4SBarry Smith PetscInt n, i, j; 1401d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14023447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1403ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14045c897100SBarry Smith #endif 140517ab2063SBarry Smith 14063a40ed3dSBarry Smith PetscFunctionBegin; 14079566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14099566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14115c897100SBarry Smith 14125c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1413fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14145c897100SBarry Smith #else 14153447b6efSHong Zhang if (usecprow) { 14163447b6efSHong Zhang m = cprow.nrows; 14173447b6efSHong Zhang ii = cprow.i; 14187b2bb3b9SHong Zhang ridx = cprow.rindex; 14193447b6efSHong Zhang } else { 14203447b6efSHong Zhang ii = a->i; 14213447b6efSHong Zhang } 142217ab2063SBarry Smith for (i = 0; i < m; i++) { 14233447b6efSHong Zhang idx = a->j + ii[i]; 1424fff043a9SJunchao Zhang v = aa + ii[i]; 14253447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14263447b6efSHong Zhang if (usecprow) { 14277b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14283447b6efSHong Zhang } else { 142917ab2063SBarry Smith alpha = x[i]; 14303447b6efSHong Zhang } 143104fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143217ab2063SBarry Smith } 14335c897100SBarry Smith #endif 14349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14359566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14369566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14383a40ed3dSBarry Smith PetscFunctionReturn(0); 143917ab2063SBarry Smith } 144017ab2063SBarry Smith 1441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1442d71ae5a4SJacob Faibussowitsch { 14435c897100SBarry Smith PetscFunctionBegin; 14449566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14459566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14465c897100SBarry Smith PetscFunctionReturn(0); 14475c897100SBarry Smith } 14485c897100SBarry Smith 1449c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145078b84d54SShri Abhyankar 1451d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1452d71ae5a4SJacob Faibussowitsch { 1453416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1454d9fead3dSBarry Smith PetscScalar *y; 145554f21887SBarry Smith const 
PetscScalar *x; 1456fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1457003131ecSBarry Smith PetscInt m = A->rmap->n; 14580298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14597b083b7cSBarry Smith PetscInt n, i; 1460362ced78SSatish Balay PetscScalar sum; 1461ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146217ab2063SBarry Smith 1463b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146497952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1465fee21e36SBarry Smith #endif 1466fee21e36SBarry Smith 14673a40ed3dSBarry Smith PetscFunctionBegin; 1468b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14699566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1470b215bc84SStefano Zampini PetscFunctionReturn(0); 1471b215bc84SStefano Zampini } 14729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14739566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14749566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1475416022c9SBarry Smith ii = a->i; 14764eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 147897952fefSHong Zhang m = a->compressedrow.nrows; 147997952fefSHong Zhang ii = a->compressedrow.i; 148097952fefSHong Zhang ridx = a->compressedrow.rindex; 148197952fefSHong Zhang for (i = 0; i < m; i++) { 148297952fefSHong Zhang n = ii[i + 1] - ii[i]; 148397952fefSHong Zhang aj = a->j + ii[i]; 1484fff043a9SJunchao Zhang aa = a_a + ii[i]; 148597952fefSHong Zhang sum = 0.0; 1486003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1487003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 148897952fefSHong Zhang y[*ridx++] = sum; 148997952fefSHong Zhang } 149097952fefSHong Zhang } else { /* do not use compressed row format */ 1491b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14923d3eaba7SBarry Smith aj = a->j; 1493fff043a9SJunchao Zhang aa 
= a_a; 1494b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1495b05257ddSBarry Smith #else 149617ab2063SBarry Smith for (i = 0; i < m; i++) { 1497003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1498003131ecSBarry Smith aj = a->j + ii[i]; 1499fff043a9SJunchao Zhang aa = a_a + ii[i]; 150017ab2063SBarry Smith sum = 0.0; 1501003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150217ab2063SBarry Smith y[i] = sum; 150317ab2063SBarry Smith } 15048d195f9aSBarry Smith #endif 1505b05257ddSBarry Smith } 15069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15089566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15103a40ed3dSBarry Smith PetscFunctionReturn(0); 151117ab2063SBarry Smith } 151217ab2063SBarry Smith 1513d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1514d71ae5a4SJacob Faibussowitsch { 1515b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1516b434eb95SMatthew G. Knepley PetscScalar *y; 1517b434eb95SMatthew G. Knepley const PetscScalar *x; 1518fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1519b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1520b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1521b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1522b434eb95SMatthew G. Knepley PetscScalar sum; 1523b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1524b434eb95SMatthew G. Knepley 1525b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1526b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1527b434eb95SMatthew G. Knepley #endif 1528b434eb95SMatthew G. Knepley 1529b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15319566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15329566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1533b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1534b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1535b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1536b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1537b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1538b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1539b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1540fff043a9SJunchao Zhang aa = a_a + ii[i]; 1541b434eb95SMatthew G. Knepley sum = 0.0; 1542b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1543b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1544b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1545b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1546b434eb95SMatthew G. Knepley } 1547b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15483d3eaba7SBarry Smith ii = a->i; 1549b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1550b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1551b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1552fff043a9SJunchao Zhang aa = a_a + ii[i]; 1553b434eb95SMatthew G. Knepley sum = 0.0; 1554b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1555b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1556b434eb95SMatthew G. Knepley y[i] = sum; 1557b434eb95SMatthew G. Knepley } 1558b434eb95SMatthew G. Knepley } 15599566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15619566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1563b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1564b434eb95SMatthew G. Knepley } 1565b434eb95SMatthew G. Knepley 1566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1567d71ae5a4SJacob Faibussowitsch { 1568b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1569b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1570b434eb95SMatthew G. Knepley const PetscScalar *x; 1571fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1572b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1573b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1574b434eb95SMatthew G. Knepley PetscScalar sum; 1575b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1576b434eb95SMatthew G. Knepley 1577b434eb95SMatthew G. Knepley PetscFunctionBegin; 15789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15809566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1581b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1583b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1584b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1585b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1586b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1587b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1588b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1589fff043a9SJunchao Zhang aa = a_a + ii[i]; 1590b434eb95SMatthew G. Knepley sum = y[*ridx]; 1591b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1592b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1593b434eb95SMatthew G. Knepley } 1594b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15953d3eaba7SBarry Smith ii = a->i; 1596b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1597b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1598b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1599fff043a9SJunchao Zhang aa = a_a + ii[i]; 1600b434eb95SMatthew G. Knepley sum = y[i]; 1601b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1602b434eb95SMatthew G. Knepley z[i] = sum; 1603b434eb95SMatthew G. Knepley } 1604b434eb95SMatthew G. Knepley } 16059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1609b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1610b434eb95SMatthew G. Knepley } 1611b434eb95SMatthew G. Knepley 1612c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1613d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1614d71ae5a4SJacob Faibussowitsch { 1615416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1616f15663dcSBarry Smith PetscScalar *y, *z; 1617f15663dcSBarry Smith const PetscScalar *x; 1618fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1619d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1620d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1621362ced78SSatish Balay PetscScalar sum; 1622ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16239ea0dfa2SSatish Balay 16243a40ed3dSBarry Smith PetscFunctionBegin; 1625b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16269566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1627b215bc84SStefano Zampini PetscFunctionReturn(0); 1628b215bc84SStefano Zampini } 16299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16319566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16324eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163348a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163497952fefSHong Zhang m = a->compressedrow.nrows; 163597952fefSHong Zhang ii = a->compressedrow.i; 163697952fefSHong Zhang ridx = a->compressedrow.rindex; 163797952fefSHong Zhang for (i = 0; i < m; i++) { 163897952fefSHong Zhang n = ii[i + 1] - ii[i]; 163997952fefSHong Zhang aj = a->j + ii[i]; 1640fff043a9SJunchao Zhang aa = a_a + ii[i]; 164197952fefSHong Zhang sum = y[*ridx]; 1642f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164397952fefSHong Zhang z[*ridx++] = sum; 164497952fefSHong Zhang } 164597952fefSHong Zhang } else { /* do not use compressed row format */ 16463d3eaba7SBarry Smith ii = a->i; 1647f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16483d3eaba7SBarry Smith aj = a->j; 1649fff043a9SJunchao Zhang aa = a_a; 1650f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1651f15663dcSBarry Smith #else 165217ab2063SBarry Smith for (i = 0; i < m; i++) { 1653f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1654f15663dcSBarry Smith aj = a->j + ii[i]; 1655fff043a9SJunchao Zhang aa = a_a + ii[i]; 165617ab2063SBarry Smith sum = y[i]; 1657f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165817ab2063SBarry Smith z[i] = sum; 165917ab2063SBarry Smith } 166002ab625aSSatish Balay #endif 1661f15663dcSBarry Smith } 16629566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16663a40ed3dSBarry Smith PetscFunctionReturn(0); 166717ab2063SBarry Smith } 166817ab2063SBarry Smith 166917ab2063SBarry Smith /* 167017ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167117ab2063SBarry Smith */ 1672d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1673d71ae5a4SJacob Faibussowitsch { 1674416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1675d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1676c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 167717ab2063SBarry Smith 16783a40ed3dSBarry Smith PetscFunctionBegin; 167909f38230SBarry Smith if (!a->diag) { 16809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1681c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168209f38230SBarry Smith } 1683d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1684c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1685c0c07093SJunchao Zhang if (alreadySet) { 1686c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1687c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1688c0c07093SJunchao Zhang } 1689c0c07093SJunchao Zhang 169009f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1691bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1692bfeeae90SHong Zhang if (a->j[j] == i) { 169309f38230SBarry Smith a->diag[i] = j; 169417ab2063SBarry Smith break; 169517ab2063SBarry Smith } 169617ab2063SBarry Smith } 169717ab2063SBarry Smith } 16983a40ed3dSBarry Smith PetscFunctionReturn(0); 169917ab2063SBarry Smith } 170017ab2063SBarry Smith 1701d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1702d71ae5a4SJacob Faibussowitsch { 170361ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170461ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170561ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 170661ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 170761ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 170861ecd0c6SBarry Smith 170961ecd0c6SBarry Smith PetscFunctionBegin; 
171061ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17129566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171361ecd0c6SBarry Smith PetscFunctionReturn(0); 171461ecd0c6SBarry Smith } 171561ecd0c6SBarry Smith 171661ecd0c6SBarry Smith if (a->diagonaldense) { 171761ecd0c6SBarry Smith cnt = 0; 171861ecd0c6SBarry Smith } else { 17199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1721349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172261ecd0c6SBarry Smith cnt++; 172361ecd0c6SBarry Smith mdiag[i] = 1; 172461ecd0c6SBarry Smith } 172561ecd0c6SBarry Smith } 172661ecd0c6SBarry Smith } 172761ecd0c6SBarry Smith if (!cnt) { 17289566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 172961ecd0c6SBarry Smith } else { 1730b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1731b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173261ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173361ecd0c6SBarry Smith 173461ecd0c6SBarry Smith a->a = NULL; 173561ecd0c6SBarry Smith a->j = NULL; 173661ecd0c6SBarry Smith a->i = NULL; 173761ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1738ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 174061ecd0c6SBarry Smith 174161ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174261ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17439566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174448a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1745447d62f5SStefano Zampini } 17469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 174861ecd0c6SBarry Smith if (singlemalloc) { 17499566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 175061ecd0c6SBarry Smith } else { 17519566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17529566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17539566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175461ecd0c6SBarry Smith } 175561ecd0c6SBarry Smith } 17569566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 175761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 175861ecd0c6SBarry Smith PetscFunctionReturn(0); 175961ecd0c6SBarry Smith } 176061ecd0c6SBarry Smith 1761be5855fcSBarry Smith /* 1762be5855fcSBarry Smith Checks for missing diagonals 1763be5855fcSBarry Smith */ 1764d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1765d71ae5a4SJacob Faibussowitsch { 1766be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17677734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1768be5855fcSBarry Smith 1769be5855fcSBarry Smith PetscFunctionBegin; 177009f38230SBarry Smith *missing = PETSC_FALSE; 17717734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177209f38230SBarry Smith *missing = PETSC_TRUE; 177309f38230SBarry Smith if (d) *d = 0; 17749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177509f38230SBarry Smith } else { 177601445905SHong Zhang PetscInt n; 177701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1778f1e2ffcdSBarry Smith diag = a->diag; 177901445905SHong Zhang for (i = 0; i < n; i++) { 17807734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178109f38230SBarry Smith *missing = PETSC_TRUE; 178209f38230SBarry Smith if (d) *d = i; 17839566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1784358d2f5dSShri Abhyankar break; 178509f38230SBarry Smith } 1786be5855fcSBarry Smith } 1787be5855fcSBarry Smith } 1788be5855fcSBarry Smith PetscFunctionReturn(0); 1789be5855fcSBarry Smith } 1790be5855fcSBarry Smith 17910da83c2eSBarry Smith #include <petscblaslapack.h> 17920da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17930da83c2eSBarry Smith 17940da83c2eSBarry Smith /* 17950da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17960da83c2eSBarry Smith */ 1797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1798d71ae5a4SJacob Faibussowitsch { 17990da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18000da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18010da83c2eSBarry Smith const PetscReal shift = 0.0; 18020da83c2eSBarry Smith PetscInt ipvt[5]; 18030da83c2eSBarry Smith PetscScalar work[25], *v_work; 18040da83c2eSBarry Smith 18050da83c2eSBarry Smith PetscFunctionBegin; 18060da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18070da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += 
bsizes[i]; 180808401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1809ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181148a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18120da83c2eSBarry Smith ncnt = 0; 18130da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18140da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18160da83c2eSBarry Smith switch (bsizes[i]) { 1817d71ae5a4SJacob Faibussowitsch case 1: 1818d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1819d71ae5a4SJacob Faibussowitsch break; 18200da83c2eSBarry Smith case 2: 18219566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18220da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18239566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18240da83c2eSBarry Smith break; 18250da83c2eSBarry Smith case 3: 18269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18270da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18289566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18290da83c2eSBarry Smith break; 18300da83c2eSBarry Smith case 4: 18319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18320da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18339566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18340da83c2eSBarry Smith break; 18350da83c2eSBarry Smith case 5: 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18370da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18389566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18390da83c2eSBarry Smith break; 18400da83c2eSBarry Smith case 6: 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18420da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18440da83c2eSBarry Smith break; 18450da83c2eSBarry Smith case 7: 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18470da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18490da83c2eSBarry Smith break; 18500da83c2eSBarry Smith default: 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18520da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18540da83c2eSBarry Smith } 18550da83c2eSBarry Smith ncnt += bsizes[i]; 18560da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18570da83c2eSBarry Smith } 185848a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18599566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18600da83c2eSBarry Smith PetscFunctionReturn(0); 18610da83c2eSBarry Smith } 18620da83c2eSBarry Smith 
1863422a814eSBarry Smith /* 1864422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1865422a814eSBarry Smith */ 1866d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1867d71ae5a4SJacob Faibussowitsch { 186871f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1869d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18702e5835c6SStefano Zampini const MatScalar *v; 187154f21887SBarry Smith PetscScalar *idiag, *mdiag; 187271f1c65dSBarry Smith 187371f1c65dSBarry Smith PetscFunctionBegin; 187471f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18759566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 187671f1c65dSBarry Smith diag = a->diag; 18774dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18782e5835c6SStefano Zampini 187971f1c65dSBarry Smith mdiag = a->mdiag; 188071f1c65dSBarry Smith idiag = a->idiag; 18819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1882422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 188371f1c65dSBarry Smith for (i = 0; i < m; i++) { 188471f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1885899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1886899639b0SHong Zhang if (PetscRealPart(fshift)) { 18879566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18887b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18897b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18907b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1892899639b0SHong Zhang } 189371f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 189471f1c65dSBarry Smith } 18959566063dSJacob 
Faibussowitsch PetscCall(PetscLogFlops(m)); 189671f1c65dSBarry Smith } else { 189771f1c65dSBarry Smith for (i = 0; i < m; i++) { 189871f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 189971f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 190071f1c65dSBarry Smith } 19019566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190271f1c65dSBarry Smith } 190371f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 190571f1c65dSBarry Smith PetscFunctionReturn(0); 190671f1c65dSBarry Smith } 190771f1c65dSBarry Smith 1908c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1909d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1910d71ae5a4SJacob Faibussowitsch { 1911416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1912e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19132e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 191454f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19153d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 191697f1f81fSBarry Smith const PetscInt *idx, *diag; 191717ab2063SBarry Smith 19183a40ed3dSBarry Smith PetscFunctionBegin; 1919b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19209566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1921b215bc84SStefano Zampini PetscFunctionReturn(0); 1922b215bc84SStefano Zampini } 1923b965ef7fSBarry Smith its = its * lits; 192491723122SBarry Smith 192571f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19269566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 192771f1c65dSBarry Smith a->fshift = fshift; 192871f1c65dSBarry Smith 
a->omega = omega; 1929ed480e8bSBarry Smith 193071f1c65dSBarry Smith diag = a->diag; 193171f1c65dSBarry Smith t = a->ssor_work; 1932ed480e8bSBarry Smith idiag = a->idiag; 193371f1c65dSBarry Smith mdiag = a->mdiag; 1934ed480e8bSBarry Smith 19359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19369566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19379566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1938ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 193917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 194017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1941ed480e8bSBarry Smith bs = b; 194217ab2063SBarry Smith for (i = 0; i < m; i++) { 194371f1c65dSBarry Smith d = fshift + mdiag[i]; 1944416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1945ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19462e5835c6SStefano Zampini v = aa + diag[i] + 1; 194717ab2063SBarry Smith sum = b[i] * d / omega; 1948003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 194917ab2063SBarry Smith x[i] = sum; 195017ab2063SBarry Smith } 19519566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19529566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19553a40ed3dSBarry Smith PetscFunctionReturn(0); 195617ab2063SBarry Smith } 1957c783ea89SBarry Smith 195808401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1959f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19604c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1961887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196217ab2063SBarry Smith 196317ab2063SBarry Smith (L + E)^{-1} A (U + 
E)^{-1} 196417ab2063SBarry Smith 1965887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 196617ab2063SBarry Smith */ 196717ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 196817ab2063SBarry Smith 196917ab2063SBarry Smith /* x = (E + U)^{-1} b */ 197017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1971416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1972ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19732e5835c6SStefano Zampini v = aa + diag[i] + 1; 197417ab2063SBarry Smith sum = b[i]; 1975e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1976ed480e8bSBarry Smith x[i] = sum * idiag[i]; 197717ab2063SBarry Smith } 197817ab2063SBarry Smith 197917ab2063SBarry Smith /* t = b - (2*E - D)x */ 19802e5835c6SStefano Zampini v = aa; 19812205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198217ab2063SBarry Smith 198317ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1984ed480e8bSBarry Smith ts = t; 1985416022c9SBarry Smith diag = a->diag; 198617ab2063SBarry Smith for (i = 0; i < m; i++) { 1987416022c9SBarry Smith n = diag[i] - a->i[i]; 1988ed480e8bSBarry Smith idx = a->j + a->i[i]; 19892e5835c6SStefano Zampini v = aa + a->i[i]; 199017ab2063SBarry Smith sum = t[i]; 1991003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1992ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1993733d66baSBarry Smith /* x = x + t */ 1994733d66baSBarry Smith x[i] += t[i]; 199517ab2063SBarry Smith } 199617ab2063SBarry Smith 19979566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 19989566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20003a40ed3dSBarry Smith PetscFunctionReturn(0); 200117ab2063SBarry Smith } 200217ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 200317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 200417ab2063SBarry Smith for (i = 0; i < m; i++) 
{ 2005416022c9SBarry Smith n = diag[i] - a->i[i]; 2006ed480e8bSBarry Smith idx = a->j + a->i[i]; 20072e5835c6SStefano Zampini v = aa + a->i[i]; 200817ab2063SBarry Smith sum = b[i]; 2009e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20105c99c7daSBarry Smith t[i] = sum; 2011ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201217ab2063SBarry Smith } 20135c99c7daSBarry Smith xb = t; 20149566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20153a40ed3dSBarry Smith } else xb = b; 201617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 201717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2018416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2019ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20202e5835c6SStefano Zampini v = aa + diag[i] + 1; 202117ab2063SBarry Smith sum = xb[i]; 2022e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20235c99c7daSBarry Smith if (xb == b) { 2024ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20255c99c7daSBarry Smith } else { 2026b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 202717ab2063SBarry Smith } 20285c99c7daSBarry Smith } 20299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 203017ab2063SBarry Smith } 203117ab2063SBarry Smith its--; 203217ab2063SBarry Smith } 203317ab2063SBarry Smith while (its--) { 203417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203517ab2063SBarry Smith for (i = 0; i < m; i++) { 2036b19a5dc2SMark Adams /* lower */ 2037b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2038ed480e8bSBarry Smith idx = a->j + a->i[i]; 20392e5835c6SStefano Zampini v = aa + a->i[i]; 204017ab2063SBarry Smith sum = b[i]; 2041e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2042b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2043b19a5dc2SMark Adams /* upper */ 2044b19a5dc2SMark Adams n = a->i[i + 1] - 
diag[i] - 1; 2045b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20462e5835c6SStefano Zampini v = aa + diag[i] + 1; 2047b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2048b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204917ab2063SBarry Smith } 2050b19a5dc2SMark Adams xb = t; 20519566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2052b19a5dc2SMark Adams } else xb = b; 205317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2055b19a5dc2SMark Adams sum = xb[i]; 2056b19a5dc2SMark Adams if (xb == b) { 2057b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2058416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2059ed480e8bSBarry Smith idx = a->j + a->i[i]; 20602e5835c6SStefano Zampini v = aa + a->i[i]; 2061e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2062ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2063b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2064b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2065b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20662e5835c6SStefano Zampini v = aa + diag[i] + 1; 2067b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2068b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206917ab2063SBarry Smith } 2070b19a5dc2SMark Adams } 2071b19a5dc2SMark Adams if (xb == b) { 20729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2073b19a5dc2SMark Adams } else { 20749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2075b19a5dc2SMark Adams } 207617ab2063SBarry Smith } 207717ab2063SBarry Smith } 20789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20799566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2081365a8a9eSBarry Smith PetscFunctionReturn(0); 208217ab2063SBarry Smith } 208317ab2063SBarry Smith 2084d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2085d71ae5a4SJacob Faibussowitsch { 2086416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20874e220ebcSLois Curfman McInnes 20883a40ed3dSBarry Smith PetscFunctionBegin; 20894e220ebcSLois Curfman McInnes info->block_size = 1.0; 20903966268fSBarry Smith info->nz_allocated = a->maxnz; 20913966268fSBarry Smith info->nz_used = a->nz; 20923966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20933966268fSBarry Smith info->assemblies = A->num_ass; 20943966268fSBarry Smith info->mallocs = A->info.mallocs; 20954dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2096d5f3da31SBarry Smith if (A->factortype) { 20974e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20984e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20994e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21004e220ebcSLois Curfman McInnes } else { 21014e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21024e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21034e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21044e220ebcSLois Curfman 
McInnes } 21053a40ed3dSBarry Smith PetscFunctionReturn(0); 210617ab2063SBarry Smith } 210717ab2063SBarry Smith 2108d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2109d71ae5a4SJacob Faibussowitsch { 2110416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2111c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211297b48c8fSBarry Smith const PetscScalar *xx; 21132e5835c6SStefano Zampini PetscScalar *bb, *aa; 2114c7da8527SEric Chamberland PetscInt d = 0; 211517ab2063SBarry Smith 21163a40ed3dSBarry Smith PetscFunctionBegin; 211797b48c8fSBarry Smith if (x && b) { 21189566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21199566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 212097b48c8fSBarry Smith for (i = 0; i < N; i++) { 2121aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2122447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 212397b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 212497b48c8fSBarry Smith } 21259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21269566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 212797b48c8fSBarry Smith } 212897b48c8fSBarry Smith 21299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2130a9817697SBarry Smith if (a->keepnonzeropattern) { 2131f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2132aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21339566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2134f1e2ffcdSBarry Smith } 2135f4df32b1SMatthew Knepley if (diag != 0.0) { 2136c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2137c7da8527SEric Chamberland d = rows[i]; 2138447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 213908401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2140c7da8527SEric Chamberland } 2141f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2142447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21432e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2144f1e2ffcdSBarry Smith } 2145f1e2ffcdSBarry Smith } 2146f1e2ffcdSBarry Smith } else { 2147f4df32b1SMatthew Knepley if (diag != 0.0) { 214817ab2063SBarry Smith for (i = 0; i < N; i++) { 2149aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21507ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2151447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2152447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2153447d62f5SStefano Zampini } else { 2154416022c9SBarry Smith a->ilen[rows[i]] = 1; 21552e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2156bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2157447d62f5SStefano Zampini } 2158447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21599566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 216017ab2063SBarry Smith } 216117ab2063SBarry Smith } 21623a40ed3dSBarry Smith } else { 216317ab2063SBarry Smith for (i = 0; i < N; i++) { 2164aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2165416022c9SBarry Smith a->ilen[rows[i]] = 0; 216617ab2063SBarry Smith } 216717ab2063SBarry Smith } 2168e56f5c9eSBarry Smith A->nonzerostate++; 2169f1e2ffcdSBarry Smith } 21709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2171dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21723a40ed3dSBarry Smith PetscFunctionReturn(0); 217317ab2063SBarry Smith } 217417ab2063SBarry Smith 2175d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2176d71ae5a4SJacob Faibussowitsch { 21776e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21786e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21792b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21806e169961SBarry Smith const PetscScalar *xx; 21812e5835c6SStefano Zampini PetscScalar *bb, *aa; 21826e169961SBarry Smith 21836e169961SBarry Smith PetscFunctionBegin; 21842e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21866e169961SBarry Smith if (x && b) { 21879566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21889566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21892b40b63fSBarry Smith vecs = PETSC_TRUE; 21906e169961SBarry Smith } 21919566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21926e169961SBarry Smith for (i = 0; i < N; i++) { 2193aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21949566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 21952205254eSKarl Rupp 21966e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21976e169961SBarry Smith } 21986e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 21996e169961SBarry Smith if (!zeroed[i]) { 22006e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22014cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22022e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22032e5835c6SStefano Zampini aa[j] = 0.0; 22046e169961SBarry Smith } 22056e169961SBarry Smith } 22064cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22076e169961SBarry Smith } 22086e169961SBarry Smith if (x && b) { 22099566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22109566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22116e169961SBarry Smith } 22129566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22136e169961SBarry Smith if (diag != 0.0) { 22149566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22151d5a398dSstefano_zampini if (missing) { 22161d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22174cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2218aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22199566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22201d5a398dSstefano_zampini } 22211d5a398dSstefano_zampini } else { 2222ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22236e169961SBarry Smith } 22241d5a398dSstefano_zampini } 22259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2226dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22276e169961SBarry Smith PetscFunctionReturn(0); 22286e169961SBarry Smith } 22296e169961SBarry Smith 2230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2231d71ae5a4SJacob Faibussowitsch { 2232fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2233fff043a9SJunchao Zhang const PetscScalar *aa; 2234fff043a9SJunchao Zhang PetscInt *itmp; 223517ab2063SBarry Smith 22363a40ed3dSBarry Smith PetscFunctionBegin; 22379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2238416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22392e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 224017ab2063SBarry Smith if (idx) { 2241bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224226fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2243f4259b30SLisandro Dalcin else *idx = NULL; 224417ab2063SBarry Smith } 22459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22463a40ed3dSBarry Smith PetscFunctionReturn(0); 224717ab2063SBarry Smith } 224817ab2063SBarry Smith 2249d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2250d71ae5a4SJacob Faibussowitsch { 22513a40ed3dSBarry Smith PetscFunctionBegin; 2252cb4a9cd9SHong Zhang if (nz) *nz = 0; 22532e5835c6SStefano Zampini if (idx) *idx = NULL; 22542e5835c6SStefano Zampini if (v) *v = NULL; 22553a40ed3dSBarry Smith PetscFunctionReturn(0); 225617ab2063SBarry Smith } 225717ab2063SBarry Smith 2258d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2259d71ae5a4SJacob Faibussowitsch { 2260416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22612e5835c6SStefano Zampini const MatScalar *v; 226236db0b34SBarry Smith PetscReal sum = 0.0; 226397f1f81fSBarry Smith PetscInt i, j; 226417ab2063SBarry Smith 22653a40ed3dSBarry Smith PetscFunctionBegin; 22669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 226717ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2268570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2269570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2270792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2271570b7f6dSBarry Smith #else 2272416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22739371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22749371c9d4SSatish Balay v++; 227517ab2063SBarry Smith } 22768f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2277570b7f6dSBarry Smith #endif 22789566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22793a40ed3dSBarry Smith } else if (type == NORM_1) { 228036db0b34SBarry Smith PetscReal *tmp; 228197f1f81fSBarry Smith PetscInt *jj = a->j; 22829566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2283064f8208SBarry Smith *nrm = 0.0; 2284416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22859371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22869371c9d4SSatish Balay v++; 228717ab2063SBarry Smith } 2288d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2289064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229017ab2063SBarry Smith } 22919566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22929566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22933a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2294064f8208SBarry Smith *nrm = 0.0; 2295d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22962e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 229717ab2063SBarry Smith sum = 0.0; 2298416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 22999371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23009371c9d4SSatish Balay v2++; 230117ab2063SBarry Smith } 2302064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230317ab2063SBarry Smith } 23049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2305f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23073a40ed3dSBarry Smith PetscFunctionReturn(0); 230817ab2063SBarry Smith } 230917ab2063SBarry Smith 2310d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2311d71ae5a4SJacob Faibussowitsch { 23123d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231354f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23142e5835c6SStefano Zampini const MatScalar *va, *vb; 
231597f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2316cd0d46ebSvictorle 2317cd0d46ebSvictorle PetscFunctionBegin; 23189566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23199566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23205485867bSBarry Smith if (ma != nb || na != mb) { 23215485867bSBarry Smith *f = PETSC_FALSE; 23225485867bSBarry Smith PetscFunctionReturn(0); 23235485867bSBarry Smith } 23249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23269371c9d4SSatish Balay aii = aij->i; 23279371c9d4SSatish Balay bii = bij->i; 23289371c9d4SSatish Balay adx = aij->j; 23299371c9d4SSatish Balay bdx = bij->j; 23309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2332cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2333cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2334cd0d46ebSvictorle 2335cd0d46ebSvictorle *f = PETSC_TRUE; 2336cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2337cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 233897f1f81fSBarry Smith PetscInt idc, idr; 23395485867bSBarry Smith PetscScalar vc, vr; 2340cd0d46ebSvictorle /* column/row index/value */ 23415485867bSBarry Smith idc = adx[aptr[i]]; 23425485867bSBarry Smith idr = bdx[bptr[idc]]; 23435485867bSBarry Smith vc = va[aptr[i]]; 23445485867bSBarry Smith vr = vb[bptr[idc]]; 23455485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23465485867bSBarry Smith *f = PETSC_FALSE; 23475485867bSBarry Smith goto done; 2348cd0d46ebSvictorle } else { 23495485867bSBarry Smith aptr[i]++; 23505485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2351cd0d46ebSvictorle } 2352cd0d46ebSvictorle } 2353cd0d46ebSvictorle } 2354cd0d46ebSvictorle done: 23559566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23569566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2359cd0d46ebSvictorle PetscFunctionReturn(0); 2360cd0d46ebSvictorle } 2361cd0d46ebSvictorle 2362d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2363d71ae5a4SJacob Faibussowitsch { 23643d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236554f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236654f21887SBarry Smith MatScalar *va, *vb; 23671cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23681cbb95d3SBarry Smith 23691cbb95d3SBarry Smith PetscFunctionBegin; 23709566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23719566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23721cbb95d3SBarry Smith if (ma != nb || na != mb) { 23731cbb95d3SBarry Smith *f = PETSC_FALSE; 23741cbb95d3SBarry Smith PetscFunctionReturn(0); 23751cbb95d3SBarry Smith } 23769371c9d4SSatish Balay aii = aij->i; 23779371c9d4SSatish Balay bii = bij->i; 23789371c9d4SSatish Balay adx = aij->j; 23799371c9d4SSatish Balay bdx = bij->j; 23809371c9d4SSatish Balay va = aij->a; 23819371c9d4SSatish Balay vb = bij->a; 23829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23841cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23851cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23861cbb95d3SBarry Smith 23871cbb95d3SBarry Smith *f = PETSC_TRUE; 23881cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23891cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23901cbb95d3SBarry Smith PetscInt idc, idr; 23911cbb95d3SBarry Smith PetscScalar vc, vr; 23921cbb95d3SBarry Smith /* column/row index/value */ 23931cbb95d3SBarry Smith idc = adx[aptr[i]]; 23941cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
23951cbb95d3SBarry Smith vc = va[aptr[i]]; 23961cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23971cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 23981cbb95d3SBarry Smith *f = PETSC_FALSE; 23991cbb95d3SBarry Smith goto done; 24001cbb95d3SBarry Smith } else { 24011cbb95d3SBarry Smith aptr[i]++; 24021cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24031cbb95d3SBarry Smith } 24041cbb95d3SBarry Smith } 24051cbb95d3SBarry Smith } 24061cbb95d3SBarry Smith done: 24079566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24089566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24091cbb95d3SBarry Smith PetscFunctionReturn(0); 24101cbb95d3SBarry Smith } 24111cbb95d3SBarry Smith 2412d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2413d71ae5a4SJacob Faibussowitsch { 24149e29f15eSvictorle PetscFunctionBegin; 24159566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24169e29f15eSvictorle PetscFunctionReturn(0); 24179e29f15eSvictorle } 24189e29f15eSvictorle 2419d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2420d71ae5a4SJacob Faibussowitsch { 24211cbb95d3SBarry Smith PetscFunctionBegin; 24229566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24231cbb95d3SBarry Smith PetscFunctionReturn(0); 24241cbb95d3SBarry Smith } 24251cbb95d3SBarry Smith 2426d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2427d71ae5a4SJacob Faibussowitsch { 2428416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2429fff8e43fSBarry Smith const PetscScalar *l, *r; 2430fff8e43fSBarry Smith PetscScalar x; 243154f21887SBarry Smith MatScalar *v; 2432fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2433fff8e43fSBarry Smith const PetscInt *jj; 243417ab2063SBarry Smith 24353a40ed3dSBarry Smith PetscFunctionBegin; 
243617ab2063SBarry Smith if (ll) { 24373ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24383ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24399566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244008401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24419566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244317ab2063SBarry Smith for (i = 0; i < m; i++) { 244417ab2063SBarry Smith x = l[i]; 2445416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24462205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244717ab2063SBarry Smith } 24489566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24499566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245117ab2063SBarry Smith } 245217ab2063SBarry Smith if (rr) { 24539566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245408401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24559566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24572e5835c6SStefano Zampini jj = a->j; 24582205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246217ab2063SBarry Smith } 24639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24643a40ed3dSBarry Smith PetscFunctionReturn(0); 246517ab2063SBarry Smith } 246617ab2063SBarry Smith 2467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2468d71ae5a4SJacob Faibussowitsch { 2469db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2470d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247197f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24725d0c19d7SBarry Smith const PetscInt *irow, *icol; 24732e5835c6SStefano Zampini const PetscScalar *aa; 24745d0c19d7SBarry Smith PetscInt nrows, ncols; 247597f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 247654f21887SBarry Smith MatScalar *a_new, *mat_a; 2477416022c9SBarry Smith Mat C; 2478cdc6f3adSToby Isaac PetscBool stride; 247917ab2063SBarry Smith 24803a40ed3dSBarry Smith PetscFunctionBegin; 24819566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24829566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24839566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248417ab2063SBarry Smith 24859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2486ff718158SBarry Smith if (stride) { 24879566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2488ff718158SBarry Smith } else { 2489ff718158SBarry Smith first = 0; 2490ff718158SBarry Smith step = 0; 2491ff718158SBarry Smith } 2492fee21e36SBarry Smith if (stride && step == 1) { 249302834360SBarry Smith /* special case of contiguous rows */ 24949566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249502834360SBarry Smith /* loop over new rows determining lens and starting points */ 249602834360SBarry Smith for (i = 0; i < nrows; i++) { 2497bfeeae90SHong Zhang kstart = ai[irow[i]]; 2498a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2499a91a9bebSLisandro Dalcin starts[i] = kstart; 250002834360SBarry Smith for (k = kstart; k < kend; k++) { 2501bfeeae90SHong Zhang if (aj[k] >= 
first) { 250202834360SBarry Smith starts[i] = k; 250302834360SBarry Smith break; 250402834360SBarry Smith } 250502834360SBarry Smith } 2506a2744918SBarry Smith sum = 0; 250702834360SBarry Smith while (k < kend) { 2508bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2509a2744918SBarry Smith sum++; 251002834360SBarry Smith } 2511a2744918SBarry Smith lens[i] = sum; 251202834360SBarry Smith } 251302834360SBarry Smith /* create submatrix */ 2514cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251597f1f81fSBarry Smith PetscInt n_cols, n_rows; 25169566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2517aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25189566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251908480c60SBarry Smith C = *B; 25203a40ed3dSBarry Smith } else { 25213bef6203SJed Brown PetscInt rbs, cbs; 25229566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25239566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25249566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25259566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25279566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252908480c60SBarry Smith } 2530db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2531db02288aSLois Curfman McInnes 253202834360SBarry Smith /* loop over rows inserting into submatrix */ 2533db02288aSLois Curfman McInnes a_new = c->a; 2534db02288aSLois Curfman McInnes j_new = c->j; 2535db02288aSLois Curfman McInnes i_new = c->i; 25369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253702834360SBarry Smith for (i 
= 0; i < nrows; i++) { 2538a2744918SBarry Smith ii = starts[i]; 2539a2744918SBarry Smith lensi = lens[i]; 2540ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25419566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2542a2744918SBarry Smith a_new += lensi; 2543a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2544a2744918SBarry Smith c->ilen[i] = lensi; 254502834360SBarry Smith } 25469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25479566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25483a40ed3dSBarry Smith } else { 25499566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25524dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25536bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25544dcab191SBarry Smith smap[icol[i]] = i + 1; 25554dcab191SBarry Smith } 25564dcab191SBarry Smith 255702834360SBarry Smith /* determine lens of each row */ 255802834360SBarry Smith for (i = 0; i < nrows; i++) { 2559bfeeae90SHong Zhang kstart = ai[irow[i]]; 256002834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256102834360SBarry Smith lens[i] = 0; 256202834360SBarry Smith for (k = kstart; k < kend; k++) { 2563ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256402834360SBarry Smith } 256502834360SBarry Smith } 256617ab2063SBarry Smith /* Create and fill new matrix */ 2567a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2568ace3abfcSBarry Smith PetscBool equal; 25690f5bd95cSBarry Smith 257099141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2571aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == 
ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25729566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 257328b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25749566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257508480c60SBarry Smith C = *B; 25763a40ed3dSBarry Smith } else { 25773bef6203SJed Brown PetscInt rbs, cbs; 25789566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25799566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25809566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25819566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25829566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25839566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258508480c60SBarry Smith } 25869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 258799141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 258817ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258999141d43SSatish Balay row = irow[i]; 2590bfeeae90SHong Zhang kstart = ai[row]; 259199141d43SSatish Balay kend = kstart + a->ilen[row]; 2592bfeeae90SHong Zhang mat_i = c->i[i]; 259399141d43SSatish Balay mat_j = c->j + mat_i; 259499141d43SSatish Balay mat_a = c->a + mat_i; 259599141d43SSatish Balay mat_ilen = c->ilen + i; 259617ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2597bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2598ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25992e5835c6SStefano Zampini *mat_a++ = aa[k]; 260099141d43SSatish Balay (*mat_ilen)++; 260117ab2063SBarry Smith } 260217ab2063SBarry Smith } 260317ab2063SBarry Smith } 26049566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260502834360SBarry Smith /* Free work space */ 26069566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26079566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26089566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2609cdc6f3adSToby Isaac /* sort */ 2610cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2611cdc6f3adSToby Isaac PetscInt ilen; 2612cdc6f3adSToby Isaac 2613cdc6f3adSToby Isaac mat_i = c->i[i]; 2614cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2615cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2616cdc6f3adSToby Isaac ilen = c->ilen[i]; 26179566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2618cdc6f3adSToby Isaac } 261902834360SBarry Smith } 26208c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26219566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2622305c6ccfSStefano Zampini #endif 26239566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26249566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262517ab2063SBarry Smith 26269566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2627416022c9SBarry Smith *B = C; 26283a40ed3dSBarry Smith PetscFunctionReturn(0); 262917ab2063SBarry Smith } 263017ab2063SBarry Smith 2631d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2632d71ae5a4SJacob Faibussowitsch { 263382d44351SHong Zhang Mat B; 263482d44351SHong Zhang 263582d44351SHong Zhang PetscFunctionBegin; 2636c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26379566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26389566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26399566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26409566063dSJacob Faibussowitsch 
PetscCall(MatSetType(B, MATSEQAIJ)); 26419566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264282d44351SHong Zhang *subMat = B; 2643c2d650bdSHong Zhang } else { 26449566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2645c2d650bdSHong Zhang } 264682d44351SHong Zhang PetscFunctionReturn(0); 264782d44351SHong Zhang } 264882d44351SHong Zhang 2649d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2650d71ae5a4SJacob Faibussowitsch { 265163b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265263b91edcSBarry Smith Mat outA; 2653ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265463b91edcSBarry Smith 26553a40ed3dSBarry Smith PetscFunctionBegin; 265608401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26571df811f5SHong Zhang 26589566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26599566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2660a871dcd8SBarry Smith 266163b91edcSBarry Smith outA = inA; 2662d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26639566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26649566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26652205254eSKarl Rupp 26669566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26679566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26682205254eSKarl Rupp 2669c3122656SLisandro Dalcin a->row = row; 26702205254eSKarl Rupp 26719566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26729566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26732205254eSKarl Rupp 2674c3122656SLisandro Dalcin a->col = col; 267563b91edcSBarry Smith 267636db0b34SBarry Smith /* Create the inverse permutation so 
that it can be used in MatLUFactorNumeric() */ 26779566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26789566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2679f0ec6fceSSatish Balay 268094a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268294a9d846SBarry Smith } 268363b91edcSBarry Smith 26849566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2685137fb511SHong Zhang if (row_identity && col_identity) { 26869566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2687137fb511SHong Zhang } else { 26889566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2689137fb511SHong Zhang } 26903a40ed3dSBarry Smith PetscFunctionReturn(0); 2691a871dcd8SBarry Smith } 2692a871dcd8SBarry Smith 2693d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2694d71ae5a4SJacob Faibussowitsch { 2695f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2696dfa0f9e5SStefano Zampini PetscScalar *v; 2697c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26983a40ed3dSBarry Smith 26993a40ed3dSBarry Smith PetscFunctionBegin; 27009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27019566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2702792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27039566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27063a40ed3dSBarry Smith PetscFunctionReturn(0); 2707f0b747eeSBarry Smith } 2708f0b747eeSBarry Smith 2709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 
2710d71ae5a4SJacob Faibussowitsch { 271116b64355SHong Zhang PetscInt i; 271216b64355SHong Zhang 271316b64355SHong Zhang PetscFunctionBegin; 271416b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27159566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271616b64355SHong Zhang 271748a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27189566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 271916b64355SHong Zhang 272016b64355SHong Zhang if (submatj->rbuf1) { 27219566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27229566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272316b64355SHong Zhang } 272416b64355SHong Zhang 272548a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27269566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27279566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272816b64355SHong Zhang } 272916b64355SHong Zhang 273016b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27319566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->rmap)); 27329566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27339566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273416b64355SHong Zhang #else 27359566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273616b64355SHong Zhang #endif 273716b64355SHong Zhang 273816b64355SHong Zhang if (!submatj->allcolumns) { 273916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27409566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->cmap)); 274116b64355SHong Zhang #else 27429566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274316b64355SHong 
Zhang #endif 274416b64355SHong Zhang } 27459566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274616b64355SHong Zhang 27479566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 274816b64355SHong Zhang PetscFunctionReturn(0); 274916b64355SHong Zhang } 275016b64355SHong Zhang 2751d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2752d71ae5a4SJacob Faibussowitsch { 275316b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27545c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275516b64355SHong Zhang 275616b64355SHong Zhang PetscFunctionBegin; 27579566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27589566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 275916b64355SHong Zhang PetscFunctionReturn(0); 276016b64355SHong Zhang } 276116b64355SHong Zhang 276289a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2764d71ae5a4SJacob Faibussowitsch { 27652d033e1fSHong Zhang PetscInt i; 27660fb991dcSHong Zhang Mat C; 27670fb991dcSHong Zhang Mat_SeqAIJ *c; 27680fb991dcSHong Zhang Mat_SubSppt *submatj; 27692d033e1fSHong Zhang 27702d033e1fSHong Zhang PetscFunctionBegin; 27712d033e1fSHong Zhang for (i = 0; i < n; i++) { 27720fb991dcSHong Zhang C = (*mat)[i]; 27730fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27740fb991dcSHong Zhang submatj = c->submatis1; 27752d033e1fSHong Zhang if (submatj) { 2776682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277726cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27789566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27799566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27809566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27813faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27829566063dSJacob 
Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27839566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27849566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2785682e4c99SStefano Zampini } 27862d033e1fSHong Zhang } else { 27879566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27882d033e1fSHong Zhang } 27892d033e1fSHong Zhang } 279086e85357SHong Zhang 279163a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27929566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279363a75b2aSHong Zhang 27949566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27952d033e1fSHong Zhang PetscFunctionReturn(0); 27962d033e1fSHong Zhang } 27972d033e1fSHong Zhang 2798d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2799d71ae5a4SJacob Faibussowitsch { 280097f1f81fSBarry Smith PetscInt i; 2801cddf8d76SBarry Smith 28023a40ed3dSBarry Smith PetscFunctionBegin; 280348a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2804cddf8d76SBarry Smith 280548a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28063a40ed3dSBarry Smith PetscFunctionReturn(0); 2807cddf8d76SBarry Smith } 2808cddf8d76SBarry Smith 2809d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2810d71ae5a4SJacob Faibussowitsch { 2811e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28125d0c19d7SBarry Smith PetscInt row, i, j, k, l, m, n, *nidx, isz, val; 28135d0c19d7SBarry Smith const PetscInt *idx; 281497f1f81fSBarry Smith PetscInt start, end, *ai, *aj; 2815f1af5d2fSBarry Smith PetscBT table; 2816bbd702dbSSatish Balay 28173a40ed3dSBarry Smith PetscFunctionBegin; 2818d0f46423SBarry Smith m = A->rmap->n; 2819e4d965acSSatish Balay ai = a->i; 
2820bfeeae90SHong Zhang aj = a->j; 28218a047759SSatish Balay 282208401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282306763907SSatish Balay 28249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28259566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282606763907SSatish Balay 2827e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2828b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2829e4d965acSSatish Balay isz = 0; 28309566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2831e4d965acSSatish Balay 2832e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28339566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28349566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2835e4d965acSSatish Balay 2836dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2837e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28382205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28394dcbc457SBarry Smith } 28409566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2842e4d965acSSatish Balay 284304a348a9SBarry Smith k = 0; 284404a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 284504a348a9SBarry Smith n = isz; 284606763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2847e4d965acSSatish Balay row = nidx[k]; 2848e4d965acSSatish Balay start = ai[row]; 2849e4d965acSSatish Balay end = ai[row + 1]; 285004a348a9SBarry Smith for (l = start; l < end; l++) { 2851efb16452SHong Zhang val = aj[l]; 28522205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2853e4d965acSSatish Balay } 2854e4d965acSSatish Balay } 2855e4d965acSSatish Balay } 
28569566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2857e4d965acSSatish Balay } 28589566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28599566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28603a40ed3dSBarry Smith PetscFunctionReturn(0); 28614dcbc457SBarry Smith } 286217ab2063SBarry Smith 28630513a670SBarry Smith /* -------------------------------------------------------------- */ 2864d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2865d71ae5a4SJacob Faibussowitsch { 28660513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28673b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28685d0c19d7SBarry Smith const PetscInt *row, *col; 28695d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 287056cd22aeSBarry Smith IS icolp, irowp; 28710298fd71SBarry Smith PetscInt *cwork = NULL; 28720298fd71SBarry Smith PetscScalar *vwork = NULL; 28730513a670SBarry Smith 28743a40ed3dSBarry Smith PetscFunctionBegin; 28759566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 28769566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 28779566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 28789566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 28790513a670SBarry Smith 28800513a670SBarry Smith /* determine lengths of permuted rows */ 28819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 28822205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 28839566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 28849566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 28859566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 28869566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 
28879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 28889566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 28890513a670SBarry Smith 28909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 28910513a670SBarry Smith for (i = 0; i < m; i++) { 28929566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28932205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 28949566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 28959566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28960513a670SBarry Smith } 28979566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 28982205254eSKarl Rupp 28993c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29002205254eSKarl Rupp 29018c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29029566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29039fe5e383SStefano Zampini #endif 29049566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29059566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29069566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29079566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29089566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29099566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 291048a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29113a40ed3dSBarry Smith PetscFunctionReturn(0); 29120513a670SBarry Smith } 29130513a670SBarry Smith 2914d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2915d71ae5a4SJacob Faibussowitsch { 2916cb5b572fSBarry Smith PetscFunctionBegin; 291733f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 291833f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2919be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2920be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29212e5835c6SStefano Zampini const PetscScalar *aa; 2922be6bf707SBarry Smith 29239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 292408401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29259566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29269566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2928cb5b572fSBarry Smith } else { 29299566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2930cb5b572fSBarry Smith } 2931cb5b572fSBarry Smith PetscFunctionReturn(0); 2932cb5b572fSBarry Smith } 2933cb5b572fSBarry Smith 2934d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2935d71ae5a4SJacob Faibussowitsch { 2936273d9f13SBarry Smith PetscFunctionBegin; 29379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2938273d9f13SBarry Smith PetscFunctionReturn(0); 2939273d9f13SBarry Smith } 2940273d9f13SBarry Smith 2941d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2942d71ae5a4SJacob Faibussowitsch { 29436c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29446e111a19SKarl Rupp 29456c0721eeSBarry Smith PetscFunctionBegin; 29466c0721eeSBarry Smith *array = a->a; 29476c0721eeSBarry Smith PetscFunctionReturn(0); 29486c0721eeSBarry Smith } 29496c0721eeSBarry Smith 2950d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2951d71ae5a4SJacob Faibussowitsch { 29526c0721eeSBarry Smith PetscFunctionBegin; 2953f38c1e66SStefano Zampini *array = NULL; 29546c0721eeSBarry Smith PetscFunctionReturn(0); 29556c0721eeSBarry Smith } 2956273d9f13SBarry Smith 29578229c054SShri Abhyankar /* 29588229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29598229c054SShri Abhyankar have different nonzero structure. 29608229c054SShri Abhyankar */ 2961d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2962d71ae5a4SJacob Faibussowitsch { 2963b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2964ec7775f6SShri Abhyankar 2965ec7775f6SShri Abhyankar PetscFunctionBegin; 2966ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2967ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 2968b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 2969b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2970b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29718af7cee1SJed Brown nnz[i] = 0; 29728af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2973b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2974b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29758af7cee1SJed Brown nnz[i]++; 29768af7cee1SJed Brown } 29778af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2978ec7775f6SShri Abhyankar } 2979ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2980ec7775f6SShri Abhyankar } 2981ec7775f6SShri Abhyankar 2982d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 2983d71ae5a4SJacob Faibussowitsch { 2984b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2985b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 2986b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 2987b264fe52SHong Zhang 2988b264fe52SHong Zhang PetscFunctionBegin; 2989b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 29909566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 2991b264fe52SHong Zhang PetscFunctionReturn(0); 2992b264fe52SHong Zhang } 2993b264fe52SHong Zhang 2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 2995d71ae5a4SJacob Faibussowitsch { 2996ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 2997ac90fabeSBarry Smith 2998ac90fabeSBarry Smith PetscFunctionBegin; 2999134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3000134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3001134adf20SPierre Jolivet if (e) { 30029566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 300381fa06acSBarry Smith if (e) { 30049566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3005134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 300681fa06acSBarry Smith } 300781fa06acSBarry Smith } 300854c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 300981fa06acSBarry Smith } 3010ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30112e5835c6SStefano Zampini const PetscScalar *xa; 30122e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 301381fa06acSBarry Smith PetscBLASInt one = 1, bnz; 301481fa06acSBarry Smith 30159566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3018792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30219566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30239566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3024ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30259566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3026ac90fabeSBarry Smith } else { 30278229c054SShri Abhyankar Mat B; 30288229c054SShri Abhyankar PetscInt *nnz; 30299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30309566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30319566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30329566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30339566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30349566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30369566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30379566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30389bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30399566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3040ac90fabeSBarry Smith } 3041ac90fabeSBarry Smith PetscFunctionReturn(0); 3042ac90fabeSBarry Smith } 3043ac90fabeSBarry Smith 3044d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3045d71ae5a4SJacob Faibussowitsch { 3046354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3047354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3048354c94deSBarry Smith 
PetscInt i, nz; 3049354c94deSBarry Smith PetscScalar *a; 3050354c94deSBarry Smith 3051354c94deSBarry Smith PetscFunctionBegin; 3052354c94deSBarry Smith nz = aij->nz; 30539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30542205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3056354c94deSBarry Smith #else 3057354c94deSBarry Smith PetscFunctionBegin; 3058354c94deSBarry Smith #endif 3059354c94deSBarry Smith PetscFunctionReturn(0); 3060354c94deSBarry Smith } 3061354c94deSBarry Smith 3062d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3063d71ae5a4SJacob Faibussowitsch { 3064e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3065d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3066e34fafa9SBarry Smith PetscReal atmp; 3067985db425SBarry Smith PetscScalar *x; 3068ce496241SStefano Zampini const MatScalar *aa, *av; 3069e34fafa9SBarry Smith 3070e34fafa9SBarry Smith PetscFunctionBegin; 307128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3073ce496241SStefano Zampini aa = av; 3074e34fafa9SBarry Smith ai = a->i; 3075e34fafa9SBarry Smith aj = a->j; 3076e34fafa9SBarry Smith 30779566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 30789566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30799566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 308008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3081e34fafa9SBarry Smith for (i = 0; i < m; i++) { 30829371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30839371c9d4SSatish Balay ai++; 3084e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3085985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
30869371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 30879371c9d4SSatish Balay x[i] = atmp; 30889371c9d4SSatish Balay if (idx) idx[i] = *aj; 30899371c9d4SSatish Balay } 30909371c9d4SSatish Balay aa++; 30919371c9d4SSatish Balay aj++; 3092985db425SBarry Smith } 3093985db425SBarry Smith } 30949566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 30959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3096985db425SBarry Smith PetscFunctionReturn(0); 3097985db425SBarry Smith } 3098985db425SBarry Smith 3099d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3100d71ae5a4SJacob Faibussowitsch { 3101985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3102d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3103985db425SBarry Smith PetscScalar *x; 3104ce496241SStefano Zampini const MatScalar *aa, *av; 3105985db425SBarry Smith 3106985db425SBarry Smith PetscFunctionBegin; 310728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3109ce496241SStefano Zampini aa = av; 3110985db425SBarry Smith ai = a->i; 3111985db425SBarry Smith aj = a->j; 3112985db425SBarry Smith 31139566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31149566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31159566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3117985db425SBarry Smith for (i = 0; i < m; i++) { 31189371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31199371c9d4SSatish Balay ai++; 3120d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31219371c9d4SSatish Balay x[i] = *aa; 31229371c9d4SSatish Balay if (idx) idx[i] = 0; 3123985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3124985db425SBarry Smith x[i] = 0.0; 3125985db425SBarry Smith if (idx) { 3126985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3127985db425SBarry Smith if (aj[j] > j) { 3128985db425SBarry Smith idx[i] = j; 3129985db425SBarry Smith break; 3130985db425SBarry Smith } 3131985db425SBarry Smith } 31321a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31331a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3134985db425SBarry Smith } 3135985db425SBarry Smith } 3136985db425SBarry Smith for (j = 0; j < ncols; j++) { 31379371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31389371c9d4SSatish Balay x[i] = *aa; 31399371c9d4SSatish Balay if (idx) idx[i] = *aj; 31409371c9d4SSatish Balay } 31419371c9d4SSatish Balay aa++; 31429371c9d4SSatish Balay aj++; 3143985db425SBarry Smith } 3144985db425SBarry Smith } 31459566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3147985db425SBarry Smith PetscFunctionReturn(0); 3148985db425SBarry Smith } 3149985db425SBarry Smith 3150d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3151d71ae5a4SJacob Faibussowitsch { 3152c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3153c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3154ce496241SStefano Zampini PetscScalar *x; 3155ce496241SStefano Zampini const MatScalar *aa, *av; 3156c87e5d42SMatthew Knepley 3157c87e5d42SMatthew Knepley PetscFunctionBegin; 31589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3159ce496241SStefano Zampini aa = av; 3160c87e5d42SMatthew Knepley ai = a->i; 3161c87e5d42SMatthew Knepley aj = a->j; 3162c87e5d42SMatthew Knepley 31639566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31649566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31659566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316608401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3167c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31689371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31699371c9d4SSatish Balay ai++; 3170f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 31719371c9d4SSatish Balay x[i] = *aa; 31729371c9d4SSatish Balay if (idx) idx[i] = 0; 3173f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3174f07e67edSHong Zhang x[i] = 0.0; 3175f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3176289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3177f07e67edSHong Zhang if (aj[j] > j) { 3178f07e67edSHong Zhang idx[i] = j; 31792205254eSKarl Rupp break; 31802205254eSKarl Rupp } 3181289a08f5SMatthew Knepley } 3182f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3183f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3184f07e67edSHong Zhang } 3185289a08f5SMatthew Knepley } 3186c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 31879371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 31889371c9d4SSatish Balay x[i] = *aa; 31899371c9d4SSatish Balay if (idx) idx[i] = *aj; 31909371c9d4SSatish Balay } 31919371c9d4SSatish Balay aa++; 31929371c9d4SSatish Balay aj++; 3193c87e5d42SMatthew Knepley } 3194c87e5d42SMatthew Knepley } 31959566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3197c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3198c87e5d42SMatthew Knepley } 3199c87e5d42SMatthew Knepley 3200d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3201d71ae5a4SJacob 
Faibussowitsch { 3202985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3203d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3204d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3205985db425SBarry Smith PetscScalar *x; 3206ce496241SStefano Zampini const MatScalar *aa, *av; 3207985db425SBarry Smith 3208985db425SBarry Smith PetscFunctionBegin; 320928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3211ce496241SStefano Zampini aa = av; 3212985db425SBarry Smith ai = a->i; 3213985db425SBarry Smith aj = a->j; 3214985db425SBarry Smith 32159566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32169566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32179566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321808401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3219985db425SBarry Smith for (i = 0; i < m; i++) { 32209371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32219371c9d4SSatish Balay ai++; 3222d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32239371c9d4SSatish Balay x[i] = *aa; 32249371c9d4SSatish Balay if (idx) idx[i] = 0; 3225985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3226985db425SBarry Smith x[i] = 0.0; 3227985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3228985db425SBarry Smith for (j = 0; j < ncols; j++) { 3229985db425SBarry Smith if (aj[j] > j) { 3230985db425SBarry Smith idx[i] = j; 3231985db425SBarry Smith break; 3232985db425SBarry Smith } 3233985db425SBarry Smith } 3234fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3235fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3236985db425SBarry Smith } 3237985db425SBarry Smith } 3238985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32399371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32409371c9d4SSatish Balay x[i] = *aa; 32419371c9d4SSatish Balay if (idx) idx[i] = *aj; 32429371c9d4SSatish Balay } 32439371c9d4SSatish Balay aa++; 32449371c9d4SSatish Balay aj++; 3245e34fafa9SBarry Smith } 3246e34fafa9SBarry Smith } 32479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3249e34fafa9SBarry Smith PetscFunctionReturn(0); 3250e34fafa9SBarry Smith } 3251bbead8a2SBarry Smith 3252d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3253d71ae5a4SJacob Faibussowitsch { 3254bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 325533d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3256bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32570da83c2eSBarry Smith const PetscReal shift = 0.0; 32581a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3259bbead8a2SBarry Smith 3260bbead8a2SBarry Smith PetscFunctionBegin; 3261a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32624a0d0026SBarry Smith if (a->ibdiagvalid) { 32634a0d0026SBarry Smith if (values) *values = a->ibdiag; 32644a0d0026SBarry Smith PetscFunctionReturn(0); 32654a0d0026SBarry Smith } 32669566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 32674dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3268bbead8a2SBarry Smith diag = a->ibdiag; 3269bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3270bbead8a2SBarry Smith /* factor and invert each block */ 3271bbead8a2SBarry Smith switch (bs) { 3272bbead8a2SBarry Smith case 1: 3273bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32749566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3275ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3276ec1892c8SHong Zhang if (allowzeropivot) { 32777b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32787b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32797b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32809566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 328198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3282ec1892c8SHong Zhang } 3283bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3284bbead8a2SBarry Smith } 3285bbead8a2SBarry Smith break; 3286bbead8a2SBarry Smith case 2: 3287bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32889371c9d4SSatish Balay ij[0] = 2 * i; 32899371c9d4SSatish Balay ij[1] = 2 * i + 1; 32909566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 32919566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 32927b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32939566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3294bbead8a2SBarry Smith diag += 4; 3295bbead8a2SBarry Smith } 3296bbead8a2SBarry Smith break; 3297bbead8a2SBarry Smith case 3: 3298bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32999371c9d4SSatish Balay ij[0] = 3 * i; 33009371c9d4SSatish Balay ij[1] = 3 * i + 1; 33019371c9d4SSatish Balay ij[2] = 3 * i + 2; 33029566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33039566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33047b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3306bbead8a2SBarry Smith diag += 9; 3307bbead8a2SBarry Smith } 3308bbead8a2SBarry Smith break; 3309bbead8a2SBarry Smith case 4: 3310bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33119371c9d4SSatish Balay ij[0] = 4 * i; 33129371c9d4SSatish Balay ij[1] = 4 * i + 1; 33139371c9d4SSatish Balay ij[2] = 4 * i + 2; 33149371c9d4SSatish Balay ij[3] = 4 * i + 3; 33159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33177b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33189566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3319bbead8a2SBarry Smith diag += 16; 3320bbead8a2SBarry Smith } 3321bbead8a2SBarry Smith break; 3322bbead8a2SBarry Smith case 5: 3323bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33249371c9d4SSatish Balay ij[0] = 5 * i; 33259371c9d4SSatish Balay ij[1] = 5 * i + 1; 33269371c9d4SSatish Balay ij[2] = 5 * i + 2; 33279371c9d4SSatish Balay ij[3] = 5 * i + 3; 33289371c9d4SSatish Balay ij[4] = 5 * i + 4; 33299566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33309566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33317b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3333bbead8a2SBarry Smith diag += 25; 3334bbead8a2SBarry Smith } 3335bbead8a2SBarry Smith break; 3336bbead8a2SBarry Smith case 6: 3337bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33389371c9d4SSatish Balay ij[0] = 6 * i; 33399371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33409371c9d4SSatish Balay ij[2] = 6 * i + 2; 33419371c9d4SSatish Balay ij[3] = 6 * i + 3; 33429371c9d4SSatish Balay ij[4] = 6 * i + 4; 33439371c9d4SSatish Balay ij[5] = 6 * i + 5; 33449566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33467b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3348bbead8a2SBarry Smith diag += 36; 3349bbead8a2SBarry Smith } 3350bbead8a2SBarry Smith break; 3351bbead8a2SBarry Smith case 7: 3352bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33539371c9d4SSatish Balay ij[0] = 7 * i; 33549371c9d4SSatish Balay ij[1] = 7 * i + 1; 33559371c9d4SSatish Balay ij[2] = 7 * i + 2; 33569371c9d4SSatish Balay ij[3] = 7 * i + 3; 33579371c9d4SSatish Balay ij[4] = 7 * i + 4; 33589371c9d4SSatish Balay ij[5] = 7 * i + 5; 33599371c9d4SSatish Balay ij[6] = 7 * i + 6; /* all seven indices must be set: MatGetValues() below reads ij[0..6] */ 33609566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33627b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3364bbead8a2SBarry Smith diag += 49; 3365bbead8a2SBarry Smith } 3366bbead8a2SBarry Smith break; 3367bbead8a2SBarry Smith default: 33689566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3369bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3370ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 33719566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 33729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots,
v_work, allowzeropivot, &zeropivotdetected)); 33737b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3375bbead8a2SBarry Smith diag += bs2; 3376bbead8a2SBarry Smith } 33779566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3378bbead8a2SBarry Smith } 3379bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3380bbead8a2SBarry Smith PetscFunctionReturn(0); 3381bbead8a2SBarry Smith } 3382bbead8a2SBarry Smith 3383d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3384d71ae5a4SJacob Faibussowitsch { 338573a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3386fff043a9SJunchao Zhang PetscScalar a, *aa; 338773a71a0fSBarry Smith PetscInt m, n, i, j, col; 338873a71a0fSBarry Smith 338973a71a0fSBarry Smith PetscFunctionBegin; 339073a71a0fSBarry Smith if (!x->assembled) { 33919566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 339273a71a0fSBarry Smith for (i = 0; i < m; i++) { 339373a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 33949566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 339573a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 33969566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 339773a71a0fSBarry Smith } 339873a71a0fSBarry Smith } 3399e2ce353bSJunchao Zhang } else { 34009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34019566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3403e2ce353bSJunchao Zhang } 34049566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34059566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 340673a71a0fSBarry Smith PetscFunctionReturn(0); 
340773a71a0fSBarry Smith } 340873a71a0fSBarry Smith 3409679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3410d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3411d71ae5a4SJacob Faibussowitsch { 3412679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3413679944adSJunchao Zhang PetscScalar a; 3414679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3415679944adSJunchao Zhang 3416679944adSJunchao Zhang PetscFunctionBegin; 3417679944adSJunchao Zhang nskip = high - low; 34189566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3419679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3420679944adSJunchao Zhang for (i = 0; i < m; i++) { 3421679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34229566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3423679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3424679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34259566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3426679944adSJunchao Zhang } 3427e2ce353bSJunchao Zhang } 34289566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34299566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 3430679944adSJunchao Zhang PetscFunctionReturn(0); 3431679944adSJunchao Zhang } 3432679944adSJunchao Zhang 3433682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34340a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3435cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3436cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3437cb5b572fSBarry Smith MatMult_SeqAIJ, 343897304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34397c922b88SBarry Smith 
                                       /* continuation of the MatOps_Values initializer; each numeric comment gives the
                                          zero-based position, within this initializer, of the entry that follows it */
                                       MatMultTranspose_SeqAIJ,
                                       MatMultTransposeAdd_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 10*/ NULL,
                                       MatLUFactor_SeqAIJ,
                                       NULL,
                                       MatSOR_SeqAIJ,
                                       MatTranspose_SeqAIJ,
                                       /* 15*/ MatGetInfo_SeqAIJ,
                                       MatEqual_SeqAIJ,
                                       MatGetDiagonal_SeqAIJ,
                                       MatDiagonalScale_SeqAIJ,
                                       MatNorm_SeqAIJ,
                                       /* 20*/ NULL,
                                       MatAssemblyEnd_SeqAIJ,
                                       MatSetOption_SeqAIJ,
                                       MatZeroEntries_SeqAIJ,
                                       /* 24*/ MatZeroRows_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 29*/ MatSetUp_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 34*/ MatDuplicate_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatILUFactor_SeqAIJ,
                                       NULL,
                                       /* 39*/ MatAXPY_SeqAIJ,
                                       MatCreateSubMatrices_SeqAIJ,
                                       MatIncreaseOverlap_SeqAIJ,
                                       MatGetValues_SeqAIJ,
                                       MatCopy_SeqAIJ,
                                       /* 44*/ MatGetRowMax_SeqAIJ,
                                       MatScale_SeqAIJ,
                                       MatShift_SeqAIJ,
                                       MatDiagonalSet_SeqAIJ,
                                       MatZeroRowsColumns_SeqAIJ,
                                       /* 49*/ MatSetRandom_SeqAIJ,
                                       MatGetRowIJ_SeqAIJ,
                                       MatRestoreRowIJ_SeqAIJ,
                                       MatGetColumnIJ_SeqAIJ,
                                       MatRestoreColumnIJ_SeqAIJ,
                                       /* 54*/ MatFDColoringCreate_SeqXAIJ,
                                       NULL,
                                       NULL,
                                       MatPermute_SeqAIJ,
                                       NULL,
                                       /* 59*/ NULL,
                                       MatDestroy_SeqAIJ,
                                       MatView_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 64*/ NULL,
                                       MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 69*/ MatGetRowMaxAbs_SeqAIJ,
                                       MatGetRowMinAbs_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 74*/ NULL,
                                       MatFDColoringApply_AIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 79*/ MatFindZeroDiagonals_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatLoad_SeqAIJ,
                                       /* 84*/ MatIsSymmetric_SeqAIJ,
                                       MatIsHermitian_SeqAIJ,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /* 89*/ NULL,
                                       NULL,
                                       MatMatMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
                                       NULL,
                                       NULL,
                                       MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
                                       NULL,
                                       /* 99*/ MatProductSetFromOptions_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatConjugate_SeqAIJ,
                                       NULL,
                                       /*104*/ MatSetValuesRow_SeqAIJ,
                                       MatRealPart_SeqAIJ,
                                       MatImaginaryPart_SeqAIJ,
                                       NULL,
                                       NULL,
                                       /*109*/ MatMatSolve_SeqAIJ,
                                       NULL,
                                       MatGetRowMin_SeqAIJ,
                                       NULL,
                                       MatMissingDiagonal_SeqAIJ,
                                       /*114*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       /*119*/ NULL,
                                       NULL,
                                       NULL,
                                       NULL,
                                       MatGetMultiProcBlock_SeqAIJ,
                                       /*124*/ MatFindNonzeroRows_SeqAIJ,
                                       MatGetColumnReductions_SeqAIJ,
                                       MatInvertBlockDiagonal_SeqAIJ,
                                       MatInvertVariableBlockDiagonal_SeqAIJ,
                                       NULL,
                                       /*129*/ NULL,
                                       NULL,
                                       NULL,
                                       MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
                                       MatTransposeColoringCreate_SeqAIJ,
                                       /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
                                       MatTransColoringApplyDenToSp_SeqAIJ,
                                       NULL,
                                       NULL,
                                       MatRARtNumeric_SeqAIJ_SeqAIJ,
                                       /*139*/ NULL,
                                       NULL,
NULL, 35763a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 35779c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 35784222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 35794222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3580f4259b30SLisandro Dalcin NULL, 358172833a62Smarkadams4 NULL, 358272833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 35832d776b49SBarry Smith NULL, 35849371c9d4SSatish Balay /*150*/ MatTransposeSymbolic_SeqAIJ}; 358517ab2063SBarry Smith 3586d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3587d71ae5a4SJacob Faibussowitsch { 3588bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 358997f1f81fSBarry Smith PetscInt i, nz, n; 3590bef8e0ddSBarry Smith 3591bef8e0ddSBarry Smith PetscFunctionBegin; 3592bef8e0ddSBarry Smith nz = aij->maxnz; 3593d0f46423SBarry Smith n = mat->rmap->n; 3594ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3595bef8e0ddSBarry Smith aij->nz = nz; 3596ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 3597bef8e0ddSBarry Smith PetscFunctionReturn(0); 3598bef8e0ddSBarry Smith } 3599bef8e0ddSBarry Smith 3600a3bb6f32SFande Kong /* 3601ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3602ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3603ddea5d60SJunchao Zhang */ 3604d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3605d71ae5a4SJacob Faibussowitsch { 3606a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3607a3bb6f32SFande Kong PetscTable gid1_lid1; 3608a3bb6f32SFande Kong PetscTablePosition tpos; 360925b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 361025b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3611a3bb6f32SFande Kong 3612a3bb6f32SFande Kong PetscFunctionBegin; 3613a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3614a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3615a3bb6f32SFande Kong /* use a table */ 36169566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n, mat->cmap->N + 1, &gid1_lid1)); 3617a3bb6f32SFande Kong ec = 0; 361825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 361925b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 36209566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &data)); 3621a3bb6f32SFande Kong if (!data) { 3622a3bb6f32SFande Kong /* one based table */ 36239566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1, gid1, ++ec, INSERT_VALUES)); 3624a3bb6f32SFande Kong } 3625a3bb6f32SFande Kong } 3626a3bb6f32SFande Kong /* form array of columns we need */ 36279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 36289566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1, &tpos)); 3629a3bb6f32SFande Kong while (tpos) { 36309566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1, &tpos, &gid, &lid)); 3631a3bb6f32SFande Kong gid--; 3632a3bb6f32SFande Kong lid--; 3633a3bb6f32SFande Kong garray[lid] = gid; 3634a3bb6f32SFande Kong } 36359566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* 
sort, and rebuild */ 36369566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 363748a46eb9SPierre Jolivet for (i = 0; i < ec; i++) PetscCall(PetscTableAdd(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES)); 3638a3bb6f32SFande Kong /* compact out the extra columns in B */ 363925b670f0SStefano Zampini for (i = 0; i < nz; i++) { 364025b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36419566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &lid)); 3642a3bb6f32SFande Kong lid--; 364325b670f0SStefano Zampini jj[i] = lid; 3644a3bb6f32SFande Kong } 36459566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36469566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36479566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36489566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36499566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3650a3bb6f32SFande Kong PetscFunctionReturn(0); 3651a3bb6f32SFande Kong } 3652a3bb6f32SFande Kong 3653bef8e0ddSBarry Smith /*@ 3654bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3655bef8e0ddSBarry Smith in the matrix. 3656bef8e0ddSBarry Smith 3657bef8e0ddSBarry Smith Input Parameters: 365811a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3659bef8e0ddSBarry Smith - indices - the column indices 3660bef8e0ddSBarry Smith 366115091d37SBarry Smith Level: advanced 366215091d37SBarry Smith 3663bef8e0ddSBarry Smith Notes: 3664bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3665bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 366611a5261eSBarry Smith of the `MatSetValues()` operation. 
3667bef8e0ddSBarry Smith 3668bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 366911a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3670bef8e0ddSBarry Smith 367111a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3672bef8e0ddSBarry Smith 3673b9617806SBarry Smith The indices should start with zero, not one. 3674b9617806SBarry Smith 3675bef8e0ddSBarry Smith @*/ 3676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3677d71ae5a4SJacob Faibussowitsch { 3678bef8e0ddSBarry Smith PetscFunctionBegin; 36790700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3680dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3681cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3682bef8e0ddSBarry Smith PetscFunctionReturn(0); 3683bef8e0ddSBarry Smith } 3684bef8e0ddSBarry Smith 3685be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3686be6bf707SBarry Smith 3687d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3688d71ae5a4SJacob Faibussowitsch { 3689be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3690d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3691be6bf707SBarry Smith 3692be6bf707SBarry Smith PetscFunctionBegin; 369328b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3694be6bf707SBarry Smith 3695be6bf707SBarry Smith /* allocate space for values if not already there */ 36964dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3697be6bf707SBarry Smith 3698be6bf707SBarry Smith /* copy values over */ 36999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, 
nz)); 3700be6bf707SBarry Smith PetscFunctionReturn(0); 3701be6bf707SBarry Smith } 3702be6bf707SBarry Smith 3703be6bf707SBarry Smith /*@ 3704be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3705be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3706be6bf707SBarry Smith nonlinear portion. 3707be6bf707SBarry Smith 370811a5261eSBarry Smith Collect on mat 3709be6bf707SBarry Smith 3710be6bf707SBarry Smith Input Parameters: 371111a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3712be6bf707SBarry Smith 371315091d37SBarry Smith Level: advanced 371415091d37SBarry Smith 371511a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3716be6bf707SBarry Smith $ Create Jacobian matrix 3717be6bf707SBarry Smith $ Set linear terms into matrix 3718be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3719be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3720be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3721512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3722be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3723be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3724be6bf707SBarry Smith $ In your Jacobian routine 3725be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3726be6bf707SBarry Smith $ Set nonlinear terms in matrix 3727be6bf707SBarry Smith 3728be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. 
when you handle nonlinear solve yourself:
$    // build linear portion of Jacobian
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    loop over nonlinear iterations
$       ierr = MatRetrieveValues(mat);
$       // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
$       // call MatAssemblyBegin/End() on matrix
$       Solve linear system with Jacobian
$    endloop

  Notes:
    Matrix must already be assembled before calling this routine
    Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
    calling this routine.

    When this is called multiple times it overwrites the previous set of stored values
    and does not allocate additional space.
37460c468ba9SBarry Smith 3747db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3748be6bf707SBarry Smith @*/ 3749d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3750d71ae5a4SJacob Faibussowitsch { 3751be6bf707SBarry Smith PetscFunctionBegin; 37520700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 375328b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 375428b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3755cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3756be6bf707SBarry Smith PetscFunctionReturn(0); 3757be6bf707SBarry Smith } 3758be6bf707SBarry Smith 3759d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3760d71ae5a4SJacob Faibussowitsch { 3761be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3762d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3763be6bf707SBarry Smith 3764be6bf707SBarry Smith PetscFunctionBegin; 376528b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 376628b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3767be6bf707SBarry Smith /* copy values over */ 37689566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3769be6bf707SBarry Smith PetscFunctionReturn(0); 3770be6bf707SBarry Smith } 3771be6bf707SBarry Smith 3772be6bf707SBarry Smith /*@ 3773be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3774be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3775be6bf707SBarry Smith nonlinear portion. 

   Collective on mat

  Input Parameters:
.  mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

.seealso: `MatStoreValues()`
@*/
PetscErrorCode MatRetrieveValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* same state requirements as MatStoreValues(): assembled and not factored */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* dispatch to the implementation composed on mat under this name */
  PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
  PetscFunctionReturn(0);
}

/* --------------------------------------------------------------------------------*/
/*@C
   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
   (the default parallel PETSc format).  For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.

   Collective

   Input Parameters:
+  comm - MPI communicator, set to `PETSC_COMM_SELF`
.
m - number of rows 380917ab2063SBarry Smith . n - number of columns 381017ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 381151c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38120298fd71SBarry Smith (possibly different for each row) or NULL 381317ab2063SBarry Smith 381417ab2063SBarry Smith Output Parameter: 3815416022c9SBarry Smith . A - the matrix 381617ab2063SBarry Smith 381711a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3818f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 381911a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3820175b88e8SBarry Smith 3821b259b22eSLois Curfman McInnes Notes: 382249a6f317SBarry Smith If nnz is given then nz is ignored 382349a6f317SBarry Smith 382411a5261eSBarry Smith The AIJ format, also called 382511a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38260002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 382744cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 382817ab2063SBarry Smith 382917ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 383011a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38313d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38326da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 383317ab2063SBarry Smith 3834682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38354fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We
   search for consecutive rows with the same nonzero structure, thereby
   reusing matrix information to achieve increased efficiency.

   Options Database Keys:
+  -mat_no_inode  - Do not use inodes
-  -mat_inode_limit <limit> - Sets inode limit (max limit=5)

   Level: intermediate

.seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  PetscCall(MatCreate(comm, A));
  /* m and n are passed as both the local and the global sizes */
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* the type was just set to MATSEQAIJ, so the SeqAIJ preallocation routine is called directly */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(0);
}

/*@C
   MatSeqAIJSetPreallocation - For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.

   Collective

   Input Parameters:
+  B - The matrix
.  nz - number of nonzeros per row (same for all rows)
-  nnz - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

   Notes:
     If nnz is given then nz is ignored

    The `MATSEQAIJ` format, also called
    compressed row storage, is fully compatible with standard Fortran 77
    storage.  That is, the stored row and column indices can begin at
    either one (as in Fortran) or zero.  See the users' manual for details.

   Specify the preallocated storage with either nz or nnz (not both).
   Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
   allocation.  For large problems you MUST preallocate memory or you
   will get TERRIBLE performance, see the users' manual chapter on matrices.

   You can call `MatGetInfo()` to get information on how effective the preallocation was;
   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
   You can also run with the option -info and look for messages with the string
   malloc in them to see if additional memory allocation was needed.
3888aa95bbe8SBarry Smith 388911a5261eSBarry Smith Developer Notes: 389011a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3891a96a251dSBarry Smith entries or columns indices 3892a96a251dSBarry Smith 3893273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3894273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3895273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3896273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3897273d9f13SBarry Smith 3898273d9f13SBarry Smith Options Database Keys: 3899698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 390047b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3901273d9f13SBarry Smith 3902273d9f13SBarry Smith Level: intermediate 3903273d9f13SBarry Smith 3904db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3905db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3906273d9f13SBarry Smith @*/ 3907d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3908d71ae5a4SJacob Faibussowitsch { 3909a23d5eceSKris Buschelman PetscFunctionBegin; 39106ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39116ba663aaSJed Brown PetscValidType(B, 1); 3912cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3913a23d5eceSKris Buschelman PetscFunctionReturn(0); 3914a23d5eceSKris Buschelman } 3915a23d5eceSKris Buschelman 3916d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3917d71ae5a4SJacob Faibussowitsch { 3918273d9f13SBarry Smith Mat_SeqAIJ *b; 39192576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 392097f1f81fSBarry Smith PetscInt i; 3921273d9f13SBarry Smith 3922273d9f13SBarry Smith PetscFunctionBegin; 39232576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3924a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3925c461c341SBarry Smith skipallocation = PETSC_TRUE; 3926c461c341SBarry Smith nz = 0; 3927c461c341SBarry Smith } 39289566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39299566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3930899cda47SBarry Smith 3931435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 393208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3933cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3934d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 393508401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 393608401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3937b73539f3SBarry Smith } 3938b73539f3SBarry Smith } 3939b73539f3SBarry Smith 3940273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39412205254eSKarl Rupp 3942273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3943273d9f13SBarry Smith 3944ab93d7beSBarry Smith if (!skipallocation) { 39454dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3946071fcb05SBarry Smith if (!b->ilen) { 3947071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39489566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3949071fcb05SBarry Smith } else { 39509566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39512ee49352SLisandro Dalcin } 39524dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3953273d9f13SBarry Smith if (!nnz) { 3954435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3955c62bd62aSJed Brown else if (nz < 0) nz = 1; 39565d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3957d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3958d0f46423SBarry Smith nz = nz * B->rmap->n; 3959273d9f13SBarry Smith } else { 3960c73702f5SBarry Smith PetscInt64 nz64 = 0; 39619371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39629371c9d4SSatish Balay b->imax[i] = nnz[i]; 39639371c9d4SSatish Balay nz64 += nnz[i]; 39649371c9d4SSatish Balay } 39659566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3966273d9f13SBarry Smith } 3967ab93d7beSBarry Smith 3968273d9f13SBarry Smith /* allocate the matrix space */ 396953dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39709566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 3971396832f4SHong Zhang if (B->structure_only) { 39729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 39739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 3974396832f4SHong Zhang } else { 39759566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 3976396832f4SHong Zhang } 3977bfeeae90SHong Zhang b->i[0] = 0; 3978ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 3979396832f4SHong Zhang if (B->structure_only) { 3980396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3981396832f4SHong Zhang b->free_a = PETSC_FALSE; 3982396832f4SHong Zhang } else { 3983273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3984e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3985396832f4SHong Zhang } 3986e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3987c461c341SBarry Smith } else { 3988e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3989e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3990c461c341SBarry Smith } 3991273d9f13SBarry Smith 3992846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3993846b4da1SFande Kong /* reserve user-requested sparsity */ 39949566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 3995846b4da1SFande Kong } 3996846b4da1SFande Kong 3997273d9f13SBarry Smith b->nz = 0; 3998273d9f13SBarry Smith b->maxnz = nz; 3999273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40001baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4001cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4002cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40035519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40045519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40055519a089SJose E. Roman */ 40065519a089SJose E. Roman B->nonzerostate++; 4007273d9f13SBarry Smith PetscFunctionReturn(0); 4008273d9f13SBarry Smith } 4009273d9f13SBarry Smith 4010d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4011d71ae5a4SJacob Faibussowitsch { 4012846b4da1SFande Kong Mat_SeqAIJ *a; 4013a5bbaf83SFande Kong PetscInt i; 4014846b4da1SFande Kong 4015846b4da1SFande Kong PetscFunctionBegin; 4016846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 401714d0e64fSAlex Lindsay 401814d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 401914d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 402014d0e64fSAlex Lindsay 4021846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40222c814fdeSFande Kong /* if no saved info, we error out */ 402328b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40242c814fdeSFande Kong 4025aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40262c814fdeSFande Kong 40279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40289566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4029846b4da1SFande Kong a->i[0] = 0; 4030ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4031846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4032846b4da1SFande Kong a->nz = 0; 4033846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4034846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4035846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4036846b4da1SFande Kong A->assembled = PETSC_FALSE; 4037846b4da1SFande Kong PetscFunctionReturn(0); 4038846b4da1SFande Kong } 4039846b4da1SFande Kong 404058d36128SBarry Smith /*@ 404111a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
sparse sequential matrix in `MATSEQAIJ` format. 4042a1661176SMatthew Knepley 4043a1661176SMatthew Knepley Input Parameters: 4044a1661176SMatthew Knepley + B - the matrix 4045a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4046a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4047a1661176SMatthew Knepley - v - optional values in the matrix 4048a1661176SMatthew Knepley 4049a1661176SMatthew Knepley Level: developer 4050a1661176SMatthew Knepley 40516a9b8d82SBarry Smith Notes: 405211a5261eSBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 405358d36128SBarry Smith 40546a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40556a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40566a9b8d82SBarry Smith 40576a9b8d82SBarry Smith Developer Notes: 40586a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 405911a5261eSBarry Smith then just copies the v values directly with `PetscMemcpy()`. 40606a9b8d82SBarry Smith 406111a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
40626a9b8d82SBarry Smith 4063db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4064a1661176SMatthew Knepley @*/ 4065d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4066d71ae5a4SJacob Faibussowitsch { 4067a1661176SMatthew Knepley PetscFunctionBegin; 40680700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 40696ba663aaSJed Brown PetscValidType(B, 1); 4070cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4071a1661176SMatthew Knepley PetscFunctionReturn(0); 4072a1661176SMatthew Knepley } 4073a1661176SMatthew Knepley 4074d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4075d71ae5a4SJacob Faibussowitsch { 4076a1661176SMatthew Knepley PetscInt i; 4077a1661176SMatthew Knepley PetscInt m, n; 4078a1661176SMatthew Knepley PetscInt nz; 40796a9b8d82SBarry Smith PetscInt *nnz; 4080a1661176SMatthew Knepley 4081a1661176SMatthew Knepley PetscFunctionBegin; 4082aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4083779a8d59SSatish Balay 40849566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 40859566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4086779a8d59SSatish Balay 40879566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 40889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4089a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4090b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 409108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4092a1661176SMatthew Knepley nnz[i] = nz; 4093a1661176SMatthew Knepley } 40949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 40959566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4096a1661176SMatthew Knepley 409748a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4098a1661176SMatthew Knepley 40999566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41009566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4101a1661176SMatthew Knepley 41029566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4103a1661176SMatthew Knepley PetscFunctionReturn(0); 4104a1661176SMatthew Knepley } 4105a1661176SMatthew Knepley 4106ad7e164aSPierre Jolivet /*@ 4107ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4108ad7e164aSPierre Jolivet 4109ad7e164aSPierre Jolivet Input Parameters: 4110ad7e164aSPierre Jolivet + A - left-hand side matrix 4111ad7e164aSPierre Jolivet . B - right-hand side matrix 411211a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4113ad7e164aSPierre Jolivet 4114ad7e164aSPierre Jolivet Output Parameter: 4115ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4116ad7e164aSPierre Jolivet 4117ad7e164aSPierre Jolivet Level: intermediate 4118ad7e164aSPierre Jolivet 411911a5261eSBarry Smith Note: 412011a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4121ad7e164aSPierre Jolivet 4122db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4123ad7e164aSPierre Jolivet @*/ 4124d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4125d71ae5a4SJacob Faibussowitsch { 4126ad7e164aSPierre Jolivet PetscFunctionBegin; 4127ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4128ad7e164aSPierre Jolivet PetscValidType(A, 1); 4129ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4130ad7e164aSPierre Jolivet PetscValidType(B, 2); 4131ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4132ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4133ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4134ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4135ad7e164aSPierre Jolivet } 4136cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4137ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4138ad7e164aSPierre Jolivet } 4139ad7e164aSPierre Jolivet 4140d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4141d71ae5a4SJacob Faibussowitsch { 4142ad7e164aSPierre Jolivet Mat newmat; 4143ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4144ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4145ad7e164aSPierre Jolivet PetscScalar *v; 4146fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4147ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4148ad7e164aSPierre Jolivet PetscBool flg; 4149ad7e164aSPierre Jolivet 4150ad7e164aSPierre Jolivet PetscFunctionBegin; 415128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 415228b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 415328b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 415428b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41559566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 415628b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4157aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4158ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41599566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41609566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41619566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41629566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4163ad7e164aSPierre Jolivet i[0] = 0; 4164ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4165ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4166ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4167ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4168ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4169ad7e164aSPierre Jolivet } 4170ad7e164aSPierre Jolivet } 4171ad7e164aSPierre Jolivet } 41729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4173ad7e164aSPierre Jolivet *C = newmat; 41749566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4175ad7e164aSPierre Jolivet nnz = 0; 4176ad7e164aSPierre Jolivet } 41779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 41789566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 41799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4180ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4181ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4182ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4183ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4184ad7e164aSPierre Jolivet } 4185ad7e164aSPierre Jolivet } 4186ad7e164aSPierre Jolivet } 41879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 41889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 41899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4190ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4191ad7e164aSPierre Jolivet } 4192ad7e164aSPierre Jolivet 4193c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4194af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4195170fe5c8SBarry Smith 4196170fe5c8SBarry Smith /* 4197170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4198170fe5c8SBarry Smith 4199170fe5c8SBarry Smith n p p 42002da392ccSBarry Smith [ ] [ ] [ ] 42012da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42022da392ccSBarry Smith [ ] [ ] [ ] 4203170fe5c8SBarry Smith 4204170fe5c8SBarry Smith */ 4205d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4206d71ae5a4SJacob Faibussowitsch { 4207170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4208170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4209170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 421086214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4211170fe5c8SBarry Smith const PetscInt *ii, *idx; 4212170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4213170fe5c8SBarry Smith PetscScalar *c, *c_q; 421486214ceeSStefano Zampini PetscInt clda = sub_c->lda; 421586214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4216170fe5c8SBarry Smith 4217170fe5c8SBarry Smith PetscFunctionBegin; 4218d0f46423SBarry Smith m = A->rmap->n; 4219d0f46423SBarry Smith n = A->cmap->n; 4220d0f46423SBarry Smith p = B->cmap->n; 4221170fe5c8SBarry Smith a = sub_a->v; 4222170fe5c8SBarry Smith b = sub_b->a; 4223170fe5c8SBarry Smith c = sub_c->v; 422486214ceeSStefano Zampini if (clda == m) { 42259566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 422686214ceeSStefano Zampini } else { 422786214ceeSStefano Zampini for (j = 0; j < p; j++) 42289371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 422986214ceeSStefano Zampini } 4230170fe5c8SBarry Smith ii = sub_b->i; 4231170fe5c8SBarry Smith idx = sub_b->j; 4232170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4233170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4234170fe5c8SBarry Smith while (q-- > 0) { 423586214ceeSStefano Zampini c_q = c + clda * (*idx); 423686214ceeSStefano Zampini a_q = a + alda * i; 4237854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4238170fe5c8SBarry Smith idx++; 4239170fe5c8SBarry Smith b++; 4240170fe5c8SBarry Smith } 4241170fe5c8SBarry Smith } 4242170fe5c8SBarry Smith PetscFunctionReturn(0); 4243170fe5c8SBarry Smith } 4244170fe5c8SBarry Smith 4245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4246d71ae5a4SJacob Faibussowitsch { 4247d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 424886214ceeSStefano Zampini PetscBool cisdense; 4249170fe5c8SBarry Smith 4250170fe5c8SBarry Smith PetscFunctionBegin; 425108401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42529566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42539566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 42549566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 425548a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42569566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4257d73949e8SHong Zhang 42584222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4259170fe5c8SBarry Smith PetscFunctionReturn(0); 4260170fe5c8SBarry Smith } 4261170fe5c8SBarry Smith 4262170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42630bad9183SKris Buschelman /*MC 4264fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42650bad9183SKris Buschelman based on compressed sparse row format. 42660bad9183SKris Buschelman 42670bad9183SKris Buschelman Options Database Keys: 42680bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 42690bad9183SKris Buschelman 42700bad9183SKris Buschelman Level: beginner 42710bad9183SKris Buschelman 42720cd7f59aSBarry Smith Notes: 427311a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 42740cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 42750cd7f59aSBarry Smith in the matrix 42760cd7f59aSBarry Smith 427711a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this no 427811a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 42790cd7f59aSBarry Smith 428011a5261eSBarry Smith Developer Note: 42810cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 42820cd7f59aSBarry Smith 4283db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 42840bad9183SKris Buschelman M*/ 42850bad9183SKris Buschelman 4286ccd284c7SBarry Smith /*MC 4287ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4288ccd284c7SBarry Smith 428911a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 429011a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 429111a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4292ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4293ccd284c7SBarry Smith the above preallocation routines for simplicity. 4294ccd284c7SBarry Smith 4295ccd284c7SBarry Smith Options Database Keys: 429611a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4297ccd284c7SBarry Smith 429811a5261eSBarry Smith Note: 429911a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4300ccd284c7SBarry Smith enough exist. 
4301ccd284c7SBarry Smith 4302ccd284c7SBarry Smith Level: beginner 4303ccd284c7SBarry Smith 4304db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4305ccd284c7SBarry Smith M*/ 4306ccd284c7SBarry Smith 4307ccd284c7SBarry Smith /*MC 4308ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4309ccd284c7SBarry Smith 431011a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 431111a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 431211a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4313ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4314ccd284c7SBarry Smith the above preallocation routines for simplicity. 4315ccd284c7SBarry Smith 4316ccd284c7SBarry Smith Options Database Keys: 431711a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4318ccd284c7SBarry Smith 4319ccd284c7SBarry Smith Level: beginner 4320ccd284c7SBarry Smith 4321c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4322ccd284c7SBarry Smith M*/ 4323ccd284c7SBarry Smith 43247906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43257906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43267906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43277906f579SHong Zhang #endif 4328d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4329d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4330d24d4204SJose E. 
Roman #endif 43317906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43327906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43337906f579SHong Zhang #endif 43347906f579SHong Zhang 4335d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4336c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43374222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43387906f579SHong Zhang 43398c778c55SBarry Smith /*@C 434011a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43418c778c55SBarry Smith 43428c778c55SBarry Smith Not Collective 43438c778c55SBarry Smith 43448c778c55SBarry Smith Input Parameter: 434511a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43468c778c55SBarry Smith 43478c778c55SBarry Smith Output Parameter: 43488c778c55SBarry Smith . 
array - pointer to the data 43498c778c55SBarry Smith 43508c778c55SBarry Smith Level: intermediate 43518c778c55SBarry Smith 4352db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43538c778c55SBarry Smith @*/ 4354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4355d71ae5a4SJacob Faibussowitsch { 4356d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43578c778c55SBarry Smith 43588c778c55SBarry Smith PetscFunctionBegin; 4359d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43609566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4361d67d9f35SJunchao Zhang } else { 4362d67d9f35SJunchao Zhang *array = aij->a; 4363d67d9f35SJunchao Zhang } 4364d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4365d67d9f35SJunchao Zhang } 4366d67d9f35SJunchao Zhang 4367d67d9f35SJunchao Zhang /*@C 436811a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4369d67d9f35SJunchao Zhang 4370d67d9f35SJunchao Zhang Not Collective 4371d67d9f35SJunchao Zhang 4372d67d9f35SJunchao Zhang Input Parameters: 437311a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4374d67d9f35SJunchao Zhang - array - pointer to the data 4375d67d9f35SJunchao Zhang 4376d67d9f35SJunchao Zhang Level: intermediate 4377d67d9f35SJunchao Zhang 4378db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4379d67d9f35SJunchao Zhang @*/ 4380d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4381d71ae5a4SJacob Faibussowitsch { 4382d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4383d67d9f35SJunchao Zhang 4384d67d9f35SJunchao Zhang PetscFunctionBegin; 4385d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 43869566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4387d67d9f35SJunchao Zhang } else { 4388d67d9f35SJunchao 
Zhang *array = NULL; 4389d67d9f35SJunchao Zhang } 43909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 43919566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 43928c778c55SBarry Smith PetscFunctionReturn(0); 43938c778c55SBarry Smith } 43948c778c55SBarry Smith 439521e72a00SBarry Smith /*@C 439611a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 43978f1ea47aSStefano Zampini 43988f1ea47aSStefano Zampini Not Collective 43998f1ea47aSStefano Zampini 44008f1ea47aSStefano Zampini Input Parameter: 440111a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44028f1ea47aSStefano Zampini 44038f1ea47aSStefano Zampini Output Parameter: 44048f1ea47aSStefano Zampini . array - pointer to the data 44058f1ea47aSStefano Zampini 44068f1ea47aSStefano Zampini Level: intermediate 44078f1ea47aSStefano Zampini 4408db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44098f1ea47aSStefano Zampini @*/ 4410d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4411d71ae5a4SJacob Faibussowitsch { 4412d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44138f1ea47aSStefano Zampini 44148f1ea47aSStefano Zampini PetscFunctionBegin; 4415d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44169566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4417d67d9f35SJunchao Zhang } else { 4418d67d9f35SJunchao Zhang *array = aij->a; 4419d67d9f35SJunchao Zhang } 44208f1ea47aSStefano Zampini PetscFunctionReturn(0); 44218f1ea47aSStefano Zampini } 44228f1ea47aSStefano Zampini 44238f1ea47aSStefano Zampini /*@C 442411a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44258f1ea47aSStefano Zampini 44268f1ea47aSStefano Zampini Not Collective 44278f1ea47aSStefano Zampini 44288f1ea47aSStefano Zampini Input 
Parameter: 442911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44308f1ea47aSStefano Zampini 44318f1ea47aSStefano Zampini Output Parameter: 44328f1ea47aSStefano Zampini . array - pointer to the data 44338f1ea47aSStefano Zampini 44348f1ea47aSStefano Zampini Level: intermediate 44358f1ea47aSStefano Zampini 4436db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44378f1ea47aSStefano Zampini @*/ 4438d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4439d71ae5a4SJacob Faibussowitsch { 4440d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44418f1ea47aSStefano Zampini 44428f1ea47aSStefano Zampini PetscFunctionBegin; 4443d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44449566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4445d67d9f35SJunchao Zhang } else { 4446d67d9f35SJunchao Zhang *array = NULL; 4447d67d9f35SJunchao Zhang } 4448d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4449d67d9f35SJunchao Zhang } 4450d67d9f35SJunchao Zhang 4451d67d9f35SJunchao Zhang /*@C 445211a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4453d67d9f35SJunchao Zhang 4454d67d9f35SJunchao Zhang Not Collective 4455d67d9f35SJunchao Zhang 4456d67d9f35SJunchao Zhang Input Parameter: 445711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4458d67d9f35SJunchao Zhang 4459d67d9f35SJunchao Zhang Output Parameter: 4460d67d9f35SJunchao Zhang . 
array - pointer to the data 4461d67d9f35SJunchao Zhang 4462d67d9f35SJunchao Zhang Level: intermediate 4463d67d9f35SJunchao Zhang 4464db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4465d67d9f35SJunchao Zhang @*/ 4466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4467d71ae5a4SJacob Faibussowitsch { 4468d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4469d67d9f35SJunchao Zhang 4470d67d9f35SJunchao Zhang PetscFunctionBegin; 4471d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 44729566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4473d67d9f35SJunchao Zhang } else { 4474d67d9f35SJunchao Zhang *array = aij->a; 4475d67d9f35SJunchao Zhang } 44769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44779566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4478d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4479d67d9f35SJunchao Zhang } 4480d67d9f35SJunchao Zhang 4481d67d9f35SJunchao Zhang /*@C 4482d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4483d67d9f35SJunchao Zhang 4484d67d9f35SJunchao Zhang Not Collective 4485d67d9f35SJunchao Zhang 4486d67d9f35SJunchao Zhang Input Parameter: 4487d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4488d67d9f35SJunchao Zhang 4489d67d9f35SJunchao Zhang Output Parameter: 4490d67d9f35SJunchao Zhang . 
array - pointer to the data 4491d67d9f35SJunchao Zhang 4492d67d9f35SJunchao Zhang Level: intermediate 4493d67d9f35SJunchao Zhang 4494db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4495d67d9f35SJunchao Zhang @*/ 4496d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4497d71ae5a4SJacob Faibussowitsch { 4498d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4499d67d9f35SJunchao Zhang 4500d67d9f35SJunchao Zhang PetscFunctionBegin; 4501d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45029566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4503d67d9f35SJunchao Zhang } else { 4504d67d9f35SJunchao Zhang *array = NULL; 4505d67d9f35SJunchao Zhang } 45068f1ea47aSStefano Zampini PetscFunctionReturn(0); 45078f1ea47aSStefano Zampini } 45088f1ea47aSStefano Zampini 45098f1ea47aSStefano Zampini /*@C 451011a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45117ee59b9bSJunchao Zhang 45127ee59b9bSJunchao Zhang Not Collective 45137ee59b9bSJunchao Zhang 45147ee59b9bSJunchao Zhang Input Parameter: 451511a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45167ee59b9bSJunchao Zhang 45177ee59b9bSJunchao Zhang Output Parameters: 45187ee59b9bSJunchao Zhang + i - row map array of the matrix 45197ee59b9bSJunchao Zhang . j - column index array of the matrix 45207ee59b9bSJunchao Zhang . a - data array of the matrix 45217ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45227ee59b9bSJunchao Zhang 45237ee59b9bSJunchao Zhang Notes: 45247ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45257ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45267ee59b9bSJunchao Zhang 45277ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45287ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45297ee59b9bSJunchao Zhang 45307ee59b9bSJunchao Zhang Level: Developer 45317ee59b9bSJunchao Zhang 4532db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45337ee59b9bSJunchao Zhang @*/ 4534d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4535d71ae5a4SJacob Faibussowitsch { 45367ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45377ee59b9bSJunchao Zhang 45387ee59b9bSJunchao Zhang PetscFunctionBegin; 45397ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45407ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45417ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45427ee59b9bSJunchao Zhang } else { 45437ee59b9bSJunchao Zhang if (i) *i = aij->i; 45447ee59b9bSJunchao Zhang if (j) *j = aij->j; 45457ee59b9bSJunchao Zhang if (a) *a = aij->a; 45467ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45477ee59b9bSJunchao Zhang } 45487ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45497ee59b9bSJunchao Zhang } 45507ee59b9bSJunchao Zhang 45517ee59b9bSJunchao Zhang /*@C 455221e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 455321e72a00SBarry Smith 455421e72a00SBarry Smith Not Collective 455521e72a00SBarry Smith 455621e72a00SBarry Smith Input Parameter: 455711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 455821e72a00SBarry Smith 455921e72a00SBarry Smith Output Parameter: 456021e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 456121e72a00SBarry Smith 456221e72a00SBarry Smith Level: intermediate 456321e72a00SBarry Smith 4564db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 456521e72a00SBarry Smith @*/ 4566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4567d71ae5a4SJacob Faibussowitsch { 456821e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 456921e72a00SBarry Smith 457021e72a00SBarry Smith PetscFunctionBegin; 457121e72a00SBarry Smith *nz = aij->rmax; 457221e72a00SBarry Smith PetscFunctionReturn(0); 457321e72a00SBarry Smith } 457421e72a00SBarry Smith 4575d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4576d71ae5a4SJacob Faibussowitsch { 4577394ed5ebSJunchao Zhang MPI_Comm comm; 4578394ed5ebSJunchao Zhang PetscInt *i, *j; 4579394ed5ebSJunchao Zhang PetscInt M, N, row; 4580394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4581394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4582394ed5ebSJunchao Zhang PetscInt *Aj; 4583394ed5ebSJunchao Zhang PetscScalar *Aa; 4584cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4585cbc6b225SStefano Zampini MatType rtype; 4586394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4587394ed5ebSJunchao Zhang 4588394ed5ebSJunchao Zhang PetscFunctionBegin; 45899566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 45909566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 45919566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4592e8729f6fSJunchao Zhang i = coo_i; 4593e8729f6fSJunchao Zhang j = coo_j; 45949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4595394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4596394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4597394ed5ebSJunchao Zhang perm[k] = k; 4598394ed5ebSJunchao Zhang } 4599394ed5ebSJunchao Zhang 4600394ed5ebSJunchao Zhang /* Sort by row */ 46019566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46029371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46039371c9d4SSatish Balay if (i[k] >= 0) break; 46049371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4605394ed5ebSJunchao Zhang nneg = k; 46069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4607394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4608394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4609394ed5ebSJunchao Zhang 46109566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4612394ed5ebSJunchao Zhang 4613394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4614394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4615394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4616394ed5ebSJunchao Zhang while (k < coo_n) { 4617394ed5ebSJunchao Zhang row = i[k]; 4618394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4619394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4620394ed5ebSJunchao Zhang end = k; 46219566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4622394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4623394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4624394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4625394ed5ebSJunchao Zhang Ai[row] = 1; 4626394ed5ebSJunchao Zhang nnz++; 4627394ed5ebSJunchao Zhang 4628394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4629394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4630394ed5ebSJunchao Zhang q++; 4631394ed5ebSJunchao Zhang jmap[q] = 1; 4632394ed5ebSJunchao Zhang Aj[q] = j[p]; 4633394ed5ebSJunchao Zhang Ai[row]++; 4634394ed5ebSJunchao Zhang nnz++; 4635394ed5ebSJunchao Zhang } else { 4636394ed5ebSJunchao Zhang jmap[q]++; 4637394ed5ebSJunchao Zhang } 4638394ed5ebSJunchao Zhang } 4639394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4640394ed5ebSJunchao Zhang } 4641394ed5ebSJunchao Zhang 4642394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4643394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4644394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4645394ed5ebSJunchao Zhang jmap[0] = 0; 4646394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4647394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4648394ed5ebSJunchao Zhang PetscCount *jmap_new; 4649394ed5ebSJunchao Zhang PetscInt *Aj_new; 4650394ed5ebSJunchao Zhang 46519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46529566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46539566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4654394ed5ebSJunchao Zhang jmap = jmap_new; 4655394ed5ebSJunchao Zhang 46569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 46589566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4659394ed5ebSJunchao Zhang Aj = Aj_new; 4660394ed5ebSJunchao Zhang } 4661394ed5ebSJunchao Zhang 
4662394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4663394ed5ebSJunchao Zhang PetscCount *perm_new; 4664cbc6b225SStefano Zampini 46659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 46669566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 46679566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4668394ed5ebSJunchao Zhang perm = perm_new; 4669394ed5ebSJunchao Zhang } 4670394ed5ebSJunchao Zhang 46719566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 46729566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 46739566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4674394ed5ebSJunchao Zhang 4675394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4676394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4677394ed5ebSJunchao Zhang /* Record COO fields */ 4678394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4679394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4680394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4681394ed5ebSJunchao Zhang seqaij->perm = perm; 4682394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4683394ed5ebSJunchao Zhang } 4684394ed5ebSJunchao Zhang 4685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4686d71ae5a4SJacob Faibussowitsch { 4687394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4688394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4689394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4690394ed5ebSJunchao Zhang PetscScalar *Aa; 
4691394ed5ebSJunchao Zhang 4692394ed5ebSJunchao Zhang PetscFunctionBegin; 46939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4694394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4695b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4696b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4697b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4698394ed5ebSJunchao Zhang } 46999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4700394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4701394ed5ebSJunchao Zhang } 4702394ed5ebSJunchao Zhang 470334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47045063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 470502fe1965SBarry Smith #endif 47063d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47075063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47083d0639e7SStefano Zampini #endif 470902fe1965SBarry Smith 4710d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4711d71ae5a4SJacob Faibussowitsch { 4712273d9f13SBarry Smith Mat_SeqAIJ *b; 471338baddfdSBarry Smith PetscMPIInt size; 4714273d9f13SBarry Smith 4715273d9f13SBarry Smith PetscFunctionBegin; 47169566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 471708401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4718273d9f13SBarry Smith 47194dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47202205254eSKarl Rupp 4721b0a32e0cSBarry Smith B->data = (void *)b; 47222205254eSKarl Rupp 47239566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4724071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47252205254eSKarl Rupp 
4726f4259b30SLisandro Dalcin b->row = NULL; 4727f4259b30SLisandro Dalcin b->col = NULL; 4728f4259b30SLisandro Dalcin b->icol = NULL; 4729b810aeb4SBarry Smith b->reallocs = 0; 473036db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4731f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4732416022c9SBarry Smith b->nonew = 0; 4733f4259b30SLisandro Dalcin b->diag = NULL; 4734f4259b30SLisandro Dalcin b->solve_work = NULL; 4735f4259b30SLisandro Dalcin B->spptr = NULL; 4736f4259b30SLisandro Dalcin b->saved_values = NULL; 4737f4259b30SLisandro Dalcin b->idiag = NULL; 4738f4259b30SLisandro Dalcin b->mdiag = NULL; 4739f4259b30SLisandro Dalcin b->ssor_work = NULL; 474071f1c65dSBarry Smith b->omega = 1.0; 474171f1c65dSBarry Smith b->fshift = 0.0; 474271f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4743bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4744a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 474517ab2063SBarry Smith 47469566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4747d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 47489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 47499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4750b3866ffcSBarry Smith #endif 47519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 47529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 47539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 47549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 
47559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 47569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 47579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 47589779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 47599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4760191b95cbSRichard Tran Mills #endif 476134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 47639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 476502fe1965SBarry Smith #endif 47663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 47683d0639e7SStefano Zampini #endif 47699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4770af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 47719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4772af8000cdSHong Zhang #endif 4773d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 47749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4775d24d4204SJose E. Roman #endif 477663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 47779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 47789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 477963c07aadSStefano Zampini #endif 47809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 47819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 47829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 47839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 47849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 47859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 47869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 47879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 47889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 47899566063dSJacob 
Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 47909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 47919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 47949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 47959566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 47969566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 47979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 47983a40ed3dSBarry Smith PetscFunctionReturn(0); 479917ab2063SBarry Smith } 480017ab2063SBarry Smith 4801b24902e0SBarry Smith /* 48023893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4803b24902e0SBarry Smith */ 4804d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4805d71ae5a4SJacob Faibussowitsch { 48062a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4807071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 480817ab2063SBarry Smith 48093a40ed3dSBarry Smith PetscFunctionBegin; 4810aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4811273d9f13SBarry Smith 4812d5f3da31SBarry Smith C->factortype = A->factortype; 4813f4259b30SLisandro Dalcin c->row = NULL; 4814f4259b30SLisandro Dalcin c->col = NULL; 4815f4259b30SLisandro Dalcin c->icol = NULL; 48166ad4291fSHong Zhang c->reallocs = 0; 481717ab2063SBarry Smith 481869272f91SPierre Jolivet C->assembled = A->assembled; 481969272f91SPierre Jolivet C->preallocated = A->preallocated; 482017ab2063SBarry Smith 482169272f91SPierre Jolivet if (A->preallocated) { 48229566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48239566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4824eec197d1SBarry Smith 48259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48269566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48289566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 482917ab2063SBarry Smith 483017ab2063SBarry Smith /* allocate the matrix space */ 4831f77e22a1SHong Zhang if (mallocmatspace) { 48329566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48332205254eSKarl Rupp 4834f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48352205254eSKarl Rupp 48369566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 483717ab2063SBarry Smith if (m > 0) { 48389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4839be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48402e5835c6SStefano Zampini const PetscScalar *aa; 48412e5835c6SStefano Zampini 48429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
4845be6bf707SBarry Smith } else { 48469566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 484717ab2063SBarry Smith } 484808480c60SBarry Smith } 4849f77e22a1SHong Zhang } 485017ab2063SBarry Smith 48516ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4852416022c9SBarry Smith c->roworiented = a->roworiented; 4853416022c9SBarry Smith c->nonew = a->nonew; 4854416022c9SBarry Smith if (a->diag) { 48559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 48569566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4857071fcb05SBarry Smith } else c->diag = NULL; 48582205254eSKarl Rupp 4859f4259b30SLisandro Dalcin c->solve_work = NULL; 4860f4259b30SLisandro Dalcin c->saved_values = NULL; 4861f4259b30SLisandro Dalcin c->idiag = NULL; 4862f4259b30SLisandro Dalcin c->ssor_work = NULL; 4863a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4864e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4865e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 48666ad4291fSHong Zhang 4867893ad86cSHong Zhang c->rmax = a->rmax; 4868416022c9SBarry Smith c->nz = a->nz; 48698ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4870754ec7b1SSatish Balay 48716ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 48726ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4873cd6b891eSBarry Smith if (a->compressedrow.use) { 48746ad4291fSHong Zhang i = a->compressedrow.nrows; 48759566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 48769566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 48779566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 487827ea64f8SHong Zhang } else { 487927ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 48800298fd71SBarry Smith c->compressedrow.i = 
NULL; 48810298fd71SBarry Smith c->compressedrow.rindex = NULL; 48826ad4291fSHong Zhang } 4883ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4884e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 48854846f1f5SKris Buschelman 48869566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 488769272f91SPierre Jolivet } 48889566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 48893a40ed3dSBarry Smith PetscFunctionReturn(0); 489017ab2063SBarry Smith } 489117ab2063SBarry Smith 4892d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4893d71ae5a4SJacob Faibussowitsch { 4894b24902e0SBarry Smith PetscFunctionBegin; 48959566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 48969566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 489748a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 48989566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 48999566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4900b24902e0SBarry Smith PetscFunctionReturn(0); 4901b24902e0SBarry Smith } 4902b24902e0SBarry Smith 4903d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4904d71ae5a4SJacob Faibussowitsch { 490552f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 490652f91c60SVaclav Hapla 490752f91c60SVaclav Hapla PetscFunctionBegin; 490852f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 490952f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4910c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49119566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 
49129566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49139566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 491452f91c60SVaclav Hapla if (isbinary) { 49159566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 491652f91c60SVaclav Hapla } else if (ishdf5) { 491752f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49189566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 491952f91c60SVaclav Hapla #else 492052f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 492152f91c60SVaclav Hapla #endif 492252f91c60SVaclav Hapla } else { 492398921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 492452f91c60SVaclav Hapla } 492552f91c60SVaclav Hapla PetscFunctionReturn(0); 492652f91c60SVaclav Hapla } 492752f91c60SVaclav Hapla 4928d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4929d71ae5a4SJacob Faibussowitsch { 49303ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49313ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4932fbdbba38SShri Abhyankar 4933fbdbba38SShri Abhyankar PetscFunctionBegin; 49349566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4935bbead8a2SBarry Smith 49363ea6fe3dSLisandro Dalcin /* read in matrix header */ 49379566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 493808401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49399371c9d4SSatish Balay M = header[1]; 
49409371c9d4SSatish Balay N = header[2]; 49419371c9d4SSatish Balay nz = header[3]; 494208401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 494308401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 494408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4945fbdbba38SShri Abhyankar 49463ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49479566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49483ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49493ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49503ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49513ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49523ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49539566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49549566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49553ea6fe3dSLisandro Dalcin 49563ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49579566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4958aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49593ea6fe3dSLisandro Dalcin 4960fbdbba38SShri Abhyankar /* read in row lengths */ 49619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 49629566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 
49633ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 49649371c9d4SSatish Balay sum = 0; 49659371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 496608401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 49673ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 49689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 49699566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4970aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49713ea6fe3dSLisandro Dalcin /* store row lengths */ 49729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 49739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 4974fbdbba38SShri Abhyankar 49753ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 49769371c9d4SSatish Balay a->i[0] = 0; 49779371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 49783ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 49799566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 49803ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 49819566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 4982fbdbba38SShri Abhyankar 49839566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 49849566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 4985fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4986fbdbba38SShri Abhyankar } 4987fbdbba38SShri Abhyankar 4988d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 4989d71ae5a4SJacob Faibussowitsch { 49907264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 4991fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4992eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4993eeffb40dSHong Zhang PetscInt k; 4994eeffb40dSHong Zhang #endif 49957264ac53SSatish Balay 49963a40ed3dSBarry Smith PetscFunctionBegin; 4997bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4998d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 4999ca44d042SBarry Smith *flg = PETSC_FALSE; 5000ca44d042SBarry Smith PetscFunctionReturn(0); 5001bcd2baecSBarry Smith } 50027264ac53SSatish Balay 50037264ac53SSatish Balay /* if the a->i are the same */ 50049566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5005abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50067264ac53SSatish Balay 50077264ac53SSatish Balay /* if a->j are the same */ 50089566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5009abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5010bcd2baecSBarry Smith 50119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5013bcd2baecSBarry Smith /* if a->a are the same */ 5014eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5015eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5016fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5017eeffb40dSHong Zhang *flg = PETSC_FALSE; 50183a40ed3dSBarry Smith PetscFunctionReturn(0); 5019eeffb40dSHong Zhang } 5020eeffb40dSHong Zhang } 5021eeffb40dSHong Zhang #else 50229566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5023eeffb40dSHong Zhang #endif 50249566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5026eeffb40dSHong Zhang PetscFunctionReturn(0); 50277264ac53SSatish Balay } 502836db0b34SBarry Smith 502905869f15SSatish Balay /*@ 503011a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 503136db0b34SBarry Smith provided by the user. 503236db0b34SBarry Smith 5033d083f849SBarry Smith Collective 503436db0b34SBarry Smith 503536db0b34SBarry Smith Input Parameters: 503636db0b34SBarry Smith + comm - must be an MPI communicator of size 1 503736db0b34SBarry Smith . m - number of rows 503836db0b34SBarry Smith . n - number of columns 5039483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 504036db0b34SBarry Smith . j - column indices 504136db0b34SBarry Smith - a - matrix values 504236db0b34SBarry Smith 504336db0b34SBarry Smith Output Parameter: 504436db0b34SBarry Smith . mat - the matrix 504536db0b34SBarry Smith 504636db0b34SBarry Smith Level: intermediate 504736db0b34SBarry Smith 504836db0b34SBarry Smith Notes: 50490551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5050292fb18eSBarry Smith once the matrix is destroyed and not before 505136db0b34SBarry Smith 505236db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 505336db0b34SBarry Smith 5054bfeeae90SHong Zhang The i and j indices are 0 based 505536db0b34SBarry Smith 5056a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5057a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50588eef79e4SBarry Smith as shown 5059a4552177SSatish Balay 50608eef79e4SBarry Smith $ 1 0 0 50618eef79e4SBarry Smith $ 2 0 3 50628eef79e4SBarry Smith $ 4 5 6 50638eef79e4SBarry Smith $ 50648eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 50658eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 50668eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5067a4552177SSatish Balay 5068db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 506936db0b34SBarry Smith @*/ 5070d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5071d71ae5a4SJacob Faibussowitsch { 5072cbcfb4deSHong Zhang PetscInt ii; 507336db0b34SBarry Smith Mat_SeqAIJ *aij; 5074cbcfb4deSHong Zhang PetscInt jj; 507536db0b34SBarry Smith 507636db0b34SBarry Smith PetscFunctionBegin; 5077aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 50789566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 50799566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 50809566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 50819566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 50829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5083ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 50849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 50859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5086ab93d7beSBarry Smith 508736db0b34SBarry Smith aij->i = i; 508836db0b34SBarry Smith aij->j = j; 508936db0b34SBarry Smith aij->a = a; 509036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
509136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5092e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5093e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 509436db0b34SBarry Smith 5095cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 509636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 509776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5098aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 50999985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 510008401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 510108401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51029985e31cSBarry Smith } 510336db0b34SBarry Smith } 510476bd3646SJed Brown } 510576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 510636db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 510708401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5108aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 510936db0b34SBarry Smith } 511076bd3646SJed Brown } 511136db0b34SBarry Smith 51129566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51139566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 511436db0b34SBarry Smith PetscFunctionReturn(0); 511536db0b34SBarry Smith } 5116cbc6b225SStefano Zampini 5117f62e3866SBarry Smith /*@ 511811a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51198a0b0e6bSVictor Minden provided by the user. 51208a0b0e6bSVictor Minden 5121d083f849SBarry Smith Collective 51228a0b0e6bSVictor Minden 51238a0b0e6bSVictor Minden Input Parameters: 51248a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51258a0b0e6bSVictor Minden . m - number of rows 51268a0b0e6bSVictor Minden . n - number of columns 51278a0b0e6bSVictor Minden . i - row indices 51288a0b0e6bSVictor Minden . j - column indices 51291230e6d1SVictor Minden . a - matrix values 51301230e6d1SVictor Minden . nz - number of nonzeros 513111a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51328a0b0e6bSVictor Minden 51338a0b0e6bSVictor Minden Output Parameter: 51348a0b0e6bSVictor Minden . 
mat - the matrix 51358a0b0e6bSVictor Minden 51368a0b0e6bSVictor Minden Level: intermediate 51378a0b0e6bSVictor Minden 5138f62e3866SBarry Smith Example: 5139f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51409e99939fSJunchao Zhang .vb 51418a0b0e6bSVictor Minden 1 0 0 51428a0b0e6bSVictor Minden 2 0 3 51438a0b0e6bSVictor Minden 4 5 6 51448a0b0e6bSVictor Minden 51458a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51468a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51478a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51489e99939fSJunchao Zhang .ve 5149*d7547e51SJunchao Zhang Notes: 5150*d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5151*d7547e51SJunchao Zhang and are particularly useful in iterative applications. 51528a0b0e6bSVictor Minden 5153*d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 51548a0b0e6bSVictor Minden @*/ 5155d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5156d71ae5a4SJacob Faibussowitsch { 5157d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 51588a0b0e6bSVictor Minden 51598a0b0e6bSVictor Minden PetscFunctionBegin; 51609566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5161ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 51629566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51639566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51649566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 51661230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 51671230e6d1SVictor Minden if (idx) { 51681230e6d1SVictor Minden row = i[ii] - 1; 51691230e6d1SVictor Minden col = j[ii] - 1; 51701230e6d1SVictor Minden } else { 51711230e6d1SVictor Minden row = i[ii]; 51721230e6d1SVictor Minden col = j[ii]; 51738a0b0e6bSVictor Minden } 51749566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 51758a0b0e6bSVictor Minden } 51769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 51779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 51789566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 51798a0b0e6bSVictor Minden PetscFunctionReturn(0); 51808a0b0e6bSVictor Minden } 518136db0b34SBarry Smith 5182d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5183d71ae5a4SJacob Faibussowitsch { 5184acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5185acf2f550SJed Brown 5186acf2f550SJed Brown PetscFunctionBegin; 5187acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5188acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 51892205254eSKarl Rupp 51909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5191acf2f550SJed Brown PetscFunctionReturn(0); 5192acf2f550SJed Brown } 5193acf2f550SJed Brown 5194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5195d71ae5a4SJacob Faibussowitsch { 51969c8f2541SHong Zhang PetscFunctionBegin; 51979566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 51989c8f2541SHong Zhang PetscFunctionReturn(0); 51999c8f2541SHong Zhang } 52009c8f2541SHong Zhang 520181824310SBarry Smith /* 520253dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
520353dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 520453dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 520553dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 520653dd7562SDmitry Karpeev */ 5207d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5208d71ae5a4SJacob Faibussowitsch { 520953dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 521053dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 521153dd7562SDmitry Karpeev PetscBool seqaij; 521253dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 521353dd7562SDmitry Karpeev PetscScalar v; 521453dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 521553dd7562SDmitry Karpeev 521653dd7562SDmitry Karpeev PetscFunctionBegin; 521753dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 521853dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52199566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 522028b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 522153dd7562SDmitry Karpeev if (rowemb) { 52229566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 522308401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 522453dd7562SDmitry Karpeev } else { 522508401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 522653dd7562SDmitry Karpeev } 522753dd7562SDmitry Karpeev if (colemb) { 52289566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 522908401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 523053dd7562SDmitry Karpeev } else { 523108401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 523253dd7562SDmitry Karpeev } 523353dd7562SDmitry Karpeev 523453dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 523553dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5237ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52399566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 524053dd7562SDmitry Karpeev } 524148a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 524253dd7562SDmitry Karpeev count = 0; 524353dd7562SDmitry Karpeev rowindices = NULL; 
524453dd7562SDmitry Karpeev colindices = NULL; 524548a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 524648a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 524753dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 524853dd7562SDmitry Karpeev PetscInt row; 524953dd7562SDmitry Karpeev row = i; 525053dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 525153dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 525253dd7562SDmitry Karpeev PetscInt col; 525353dd7562SDmitry Karpeev col = Baij->j[count]; 525453dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 525553dd7562SDmitry Karpeev v = Baij->a[count]; 52569566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 525753dd7562SDmitry Karpeev ++count; 525853dd7562SDmitry Karpeev } 525953dd7562SDmitry Karpeev } 526053dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 526153dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 526253dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 526353dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 526453dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 526553dd7562SDmitry Karpeev PetscFunctionReturn(0); 526653dd7562SDmitry Karpeev } 526753dd7562SDmitry Karpeev 52684099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 52694099cc6bSBarry Smith 52704099cc6bSBarry Smith /*@C 527111a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 52724099cc6bSBarry Smith 527311a5261eSBarry Smith Collective on mat 52744099cc6bSBarry Smith 52754099cc6bSBarry Smith Input Parameters: 52764099cc6bSBarry Smith + mat - the matrix object 52774099cc6bSBarry Smith - matype - matrix type 52784099cc6bSBarry Smith 52794099cc6bSBarry Smith Options Database Key: 52804099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 52814099cc6bSBarry Smith 52824099cc6bSBarry Smith Level: intermediate 52834099cc6bSBarry Smith 5284db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 52854099cc6bSBarry Smith @*/ 5286d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5287d71ae5a4SJacob Faibussowitsch { 52884099cc6bSBarry Smith PetscBool sametype; 52895f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 52904099cc6bSBarry Smith 52914099cc6bSBarry Smith PetscFunctionBegin; 52924099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 52939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 52944099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 52954099cc6bSBarry Smith 52969566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 52975f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 52989566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 52994099cc6bSBarry Smith PetscFunctionReturn(0); 53004099cc6bSBarry Smith } 53014099cc6bSBarry Smith 53024099cc6bSBarry Smith /*@C 530311a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53044099cc6bSBarry Smith 53054099cc6bSBarry Smith Not Collective 53064099cc6bSBarry Smith 53074099cc6bSBarry Smith Input Parameters: 530811a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 53094099cc6bSBarry Smith - function - routine to convert to subtype 53104099cc6bSBarry Smith 53114099cc6bSBarry Smith Notes: 531211a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
53134099cc6bSBarry Smith 53144099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53154099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53164099cc6bSBarry Smith 53174099cc6bSBarry Smith Level: advanced 53184099cc6bSBarry Smith 5319db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53204099cc6bSBarry Smith @*/ 5321d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5322d71ae5a4SJacob Faibussowitsch { 53234099cc6bSBarry Smith PetscFunctionBegin; 53249566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53259566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 53264099cc6bSBarry Smith PetscFunctionReturn(0); 53274099cc6bSBarry Smith } 53284099cc6bSBarry Smith 53294099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53304099cc6bSBarry Smith 53314099cc6bSBarry Smith /*@C 533211a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 53334099cc6bSBarry Smith 53344099cc6bSBarry Smith Not Collective 53354099cc6bSBarry Smith 53364099cc6bSBarry Smith Level: advanced 53374099cc6bSBarry Smith 5338db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53394099cc6bSBarry Smith @*/ 5340d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5341d71ae5a4SJacob Faibussowitsch { 53424099cc6bSBarry Smith PetscFunctionBegin; 53434099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53444099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53454099cc6bSBarry Smith 53469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 53499779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 53509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5351485f9817SRichard Tran Mills #endif 53525063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 53539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 53545063d097SStefano Zampini #endif 53555063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 53569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 53575063d097SStefano Zampini #endif 53584099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 53599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 53604099cc6bSBarry Smith #endif 53614099cc6bSBarry Smith PetscFunctionReturn(0); 53624099cc6bSBarry Smith } 536353dd7562SDmitry Karpeev 536453dd7562SDmitry Karpeev /* 536581824310SBarry Smith Special version for direct calls from Fortran 536681824310SBarry Smith */ 5367af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 536881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 536981824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 537081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 537181824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 537281824310SBarry Smith #endif 537381824310SBarry Smith 537481824310SBarry Smith /* Change these macros so can be used in void function */ 537598921bdaSJacob Faibussowitsch 537698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 53779566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 53789566063dSJacob Faibussowitsch #undef PetscCall 53799371c9d4SSatish Balay #define PetscCall(...) 
\ 53809371c9d4SSatish Balay do { \ 53815f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 538298921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 538398921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 538498921bdaSJacob Faibussowitsch return; \ 538598921bdaSJacob Faibussowitsch } \ 538698921bdaSJacob Faibussowitsch } while (0) 538798921bdaSJacob Faibussowitsch 538898921bdaSJacob Faibussowitsch #undef SETERRQ 53899371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 53909371c9d4SSatish Balay do { \ 539198921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 539298921bdaSJacob Faibussowitsch return; \ 539398921bdaSJacob Faibussowitsch } while (0) 539481824310SBarry Smith 5395d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5396d71ae5a4SJacob Faibussowitsch { 539781824310SBarry Smith Mat A = *AA; 539881824310SBarry Smith PetscInt m = *mm, n = *nn; 539981824310SBarry Smith InsertMode is = *isis; 540081824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 540181824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 540281824310SBarry Smith PetscInt *imax, *ai, *ailen; 540381824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 540454f21887SBarry Smith MatScalar *ap, value, *aa; 5405ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5406ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 540781824310SBarry Smith 540881824310SBarry Smith PetscFunctionBegin; 54094994cf47SJed Brown MatCheckPreallocated(A, 1); 541081824310SBarry Smith imax = a->imax; 541181824310SBarry Smith ai = a->i; 541281824310SBarry Smith 
ailen = a->ilen; 541381824310SBarry Smith aj = a->j; 541481824310SBarry Smith aa = a->a; 541581824310SBarry Smith 541681824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 541781824310SBarry Smith row = im[k]; 541881824310SBarry Smith if (row < 0) continue; 54195f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 54209371c9d4SSatish Balay rp = aj + ai[row]; 54219371c9d4SSatish Balay ap = aa + ai[row]; 54229371c9d4SSatish Balay rmax = imax[row]; 54239371c9d4SSatish Balay nrow = ailen[row]; 542481824310SBarry Smith low = 0; 542581824310SBarry Smith high = nrow; 542681824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 542781824310SBarry Smith if (in[l] < 0) continue; 54285f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 542981824310SBarry Smith col = in[l]; 54302205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 54312205254eSKarl Rupp else value = v[k + l * m]; 54322205254eSKarl Rupp 543381824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 543481824310SBarry Smith 54352205254eSKarl Rupp if (col <= lastcol) low = 0; 54362205254eSKarl Rupp else high = nrow; 543781824310SBarry Smith lastcol = col; 543881824310SBarry Smith while (high - low > 5) { 543981824310SBarry Smith t = (low + high) / 2; 544081824310SBarry Smith if (rp[t] > col) high = t; 544181824310SBarry Smith else low = t; 544281824310SBarry Smith } 544381824310SBarry Smith for (i = low; i < high; i++) { 544481824310SBarry Smith if (rp[i] > col) break; 544581824310SBarry Smith if (rp[i] == col) { 544681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 544781824310SBarry Smith else ap[i] = value; 544881824310SBarry Smith goto noinsert; 544981824310SBarry Smith } 545081824310SBarry Smith } 545181824310SBarry Smith if (value == 0.0 && 
ignorezeroentries) goto noinsert; 545281824310SBarry Smith if (nonew == 1) goto noinsert; 54535f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5454fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 54559371c9d4SSatish Balay N = nrow++ - 1; 54569371c9d4SSatish Balay a->nz++; 54579371c9d4SSatish Balay high++; 545881824310SBarry Smith /* shift up all the later entries in this row */ 545981824310SBarry Smith for (ii = N; ii >= i; ii--) { 546081824310SBarry Smith rp[ii + 1] = rp[ii]; 546181824310SBarry Smith ap[ii + 1] = ap[ii]; 546281824310SBarry Smith } 546381824310SBarry Smith rp[i] = col; 546481824310SBarry Smith ap[i] = value; 5465e56f5c9eSBarry Smith A->nonzerostate++; 546681824310SBarry Smith noinsert:; 546781824310SBarry Smith low = i + 1; 546881824310SBarry Smith } 546981824310SBarry Smith ailen[row] = nrow; 547081824310SBarry Smith } 547181824310SBarry Smith PetscFunctionReturnVoid(); 547281824310SBarry Smith } 547398921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 547498921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 547598921bdaSJacob Faibussowitsch * original definitions */ 54769566063dSJacob Faibussowitsch #undef PetscCall 547798921bdaSJacob Faibussowitsch #undef SETERRQ 5478