xref: /petsc/src/mat/impls/sell/seq/fdsell.c (revision 9371c9d470a9602b6d10a8bf50c9b2280a79e45a)
1d4002b98SHong Zhang #include <../src/mat/impls/sell/seq/sell.h>
2d4002b98SHong Zhang #include <../src/mat/impls/aij/seq/aij.h>
3d4002b98SHong Zhang #include <petsc/private/isimpl.h>
4d4002b98SHong Zhang 
/*
 MatGetColumnIJ_SeqSELL_Color() and MatRestoreColumnIJ_SeqSELL_Color() are customized from
 MatGetColumnIJ_SeqSELL() and MatRestoreColumnIJ_SeqSELL() by adding an output
 spidx[], the index of each entry in a->colidx, to be used in MatTransposeColoringCreate_SeqSELL() and MatFDColoringCreate_SeqSELL()
*/
10*9371c9d4SSatish Balay PetscErrorCode MatGetColumnIJ_SeqSELL_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) {
11d4002b98SHong Zhang   Mat_SeqSELL *a = (Mat_SeqSELL *)A->data;
12d4002b98SHong Zhang   PetscInt     i, j, *collengths, *cia, *cja, n = A->cmap->n, totalslices;
13d4002b98SHong Zhang   PetscInt     row, col;
14d4002b98SHong Zhang   PetscInt    *cspidx;
15d4002b98SHong Zhang   PetscBool    isnonzero;
16d4002b98SHong Zhang 
17d4002b98SHong Zhang   PetscFunctionBegin;
18d4002b98SHong Zhang   *nn = n;
19d4002b98SHong Zhang   if (!ia) PetscFunctionReturn(0);
20d4002b98SHong Zhang 
219566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n + 1, &collengths));
229566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
239566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(a->nz + 1, &cja));
249566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(a->nz + 1, &cspidx));
25d4002b98SHong Zhang 
26d4002b98SHong Zhang   totalslices = A->rmap->n / 8 + ((A->rmap->n & 0x07) ? 1 : 0); /* floor(n/8) */
27d4002b98SHong Zhang   for (i = 0; i < totalslices; i++) {                           /* loop over slices */
28d4002b98SHong Zhang     for (j = a->sliidx[i], row = 0; j < a->sliidx[i + 1]; j++, row = ((row + 1) & 0x07)) {
29d4002b98SHong Zhang       isnonzero = (PetscBool)((j - a->sliidx[i]) / 8 < a->rlen[8 * i + row]);
30d4002b98SHong Zhang       if (isnonzero) collengths[a->colidx[j]]++;
31d4002b98SHong Zhang     }
32d4002b98SHong Zhang   }
33d4002b98SHong Zhang 
34d4002b98SHong Zhang   cia[0] = oshift;
35*9371c9d4SSatish Balay   for (i = 0; i < n; i++) { cia[i + 1] = cia[i] + collengths[i]; }
369566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
37d4002b98SHong Zhang 
38d4002b98SHong Zhang   for (i = 0; i < totalslices; i++) { /* loop over slices */
39d4002b98SHong Zhang     for (j = a->sliidx[i], row = 0; j < a->sliidx[i + 1]; j++, row = ((row + 1) & 0x07)) {
40d4002b98SHong Zhang       isnonzero = (PetscBool)((j - a->sliidx[i]) / 8 < a->rlen[8 * i + row]);
41d4002b98SHong Zhang       if (isnonzero) {
42d4002b98SHong Zhang         col                                         = a->colidx[j];
43d4002b98SHong Zhang         cspidx[cia[col] + collengths[col] - oshift] = j;                    /* index of a->colidx */
44d4002b98SHong Zhang         cja[cia[col] + collengths[col] - oshift]    = 8 * i + row + oshift; /* row index */
45d4002b98SHong Zhang         collengths[col]++;
46d4002b98SHong Zhang       }
47d4002b98SHong Zhang     }
48d4002b98SHong Zhang   }
49d4002b98SHong Zhang 
509566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
51*9371c9d4SSatish Balay   *ia    = cia;
52*9371c9d4SSatish Balay   *ja    = cja;
53d4002b98SHong Zhang   *spidx = cspidx;
54d4002b98SHong Zhang   PetscFunctionReturn(0);
55d4002b98SHong Zhang }
56d4002b98SHong Zhang 
57*9371c9d4SSatish Balay PetscErrorCode MatRestoreColumnIJ_SeqSELL_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) {
58d4002b98SHong Zhang   PetscFunctionBegin;
59d4002b98SHong Zhang 
60d4002b98SHong Zhang   if (!ia) PetscFunctionReturn(0);
619566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
629566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
639566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
64d4002b98SHong Zhang   PetscFunctionReturn(0);
65d4002b98SHong Zhang }
66