1d4002b98SHong Zhang #include <../src/mat/impls/sell/seq/sell.h> 2d4002b98SHong Zhang #include <../src/mat/impls/aij/seq/aij.h> 3d4002b98SHong Zhang #include <petsc/private/isimpl.h> 4d4002b98SHong Zhang 5d4002b98SHong Zhang /* 6d4002b98SHong Zhang MatGetColumnIJ_SeqSELL_Color() and MatRestoreColumnIJ_SeqSELL_Color() are customized from 7d4002b98SHong Zhang MatGetColumnIJ_SeqSELL() and MatRestoreColumnIJ_SeqSELL() by adding an output 8d4002b98SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqSELL() and MatFDColoringCreate_SeqSELL() 9d4002b98SHong Zhang */ 109371c9d4SSatish Balay PetscErrorCode MatGetColumnIJ_SeqSELL_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) { 11d4002b98SHong Zhang Mat_SeqSELL *a = (Mat_SeqSELL *)A->data; 12d4002b98SHong Zhang PetscInt i, j, *collengths, *cia, *cja, n = A->cmap->n, totalslices; 13d4002b98SHong Zhang PetscInt row, col; 14d4002b98SHong Zhang PetscInt *cspidx; 15d4002b98SHong Zhang PetscBool isnonzero; 16d4002b98SHong Zhang 17d4002b98SHong Zhang PetscFunctionBegin; 18d4002b98SHong Zhang *nn = n; 19d4002b98SHong Zhang if (!ia) PetscFunctionReturn(0); 20d4002b98SHong Zhang 219566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n + 1, &collengths)); 229566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->nz + 1, &cja)); 249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->nz + 1, &cspidx)); 25d4002b98SHong Zhang 26d4002b98SHong Zhang totalslices = A->rmap->n / 8 + ((A->rmap->n & 0x07) ? 1 : 0); /* floor(n/8) */ 27d4002b98SHong Zhang for (i = 0; i < totalslices; i++) { /* loop over slices */ 28d4002b98SHong Zhang for (j = a->sliidx[i], row = 0; j < a->sliidx[i + 1]; j++, row = ((row + 1) & 0x07)) { 29d4002b98SHong Zhang isnonzero = (PetscBool)((j - a->sliidx[i]) / 8 < a->rlen[8 * i + row]); 30d4002b98SHong Zhang if (isnonzero) collengths[a->colidx[j]]++; 31d4002b98SHong Zhang } 32d4002b98SHong Zhang } 33d4002b98SHong Zhang 34d4002b98SHong Zhang cia[0] = oshift; 35*ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 369566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 37d4002b98SHong Zhang 38d4002b98SHong Zhang for (i = 0; i < totalslices; i++) { /* loop over slices */ 39d4002b98SHong Zhang for (j = a->sliidx[i], row = 0; j < a->sliidx[i + 1]; j++, row = ((row + 1) & 0x07)) { 40d4002b98SHong Zhang isnonzero = (PetscBool)((j - a->sliidx[i]) / 8 < a->rlen[8 * i + row]); 41d4002b98SHong Zhang if (isnonzero) { 42d4002b98SHong Zhang col = a->colidx[j]; 43d4002b98SHong Zhang cspidx[cia[col] + collengths[col] - oshift] = j; /* index of a->colidx */ 44d4002b98SHong Zhang cja[cia[col] + collengths[col] - oshift] = 8 * i + row + oshift; /* row index */ 45d4002b98SHong Zhang collengths[col]++; 46d4002b98SHong Zhang } 47d4002b98SHong Zhang } 48d4002b98SHong Zhang } 49d4002b98SHong Zhang 509566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 519371c9d4SSatish Balay *ia = cia; 529371c9d4SSatish Balay *ja = cja; 53d4002b98SHong Zhang *spidx = cspidx; 54d4002b98SHong Zhang PetscFunctionReturn(0); 55d4002b98SHong Zhang } 56d4002b98SHong Zhang 579371c9d4SSatish Balay PetscErrorCode MatRestoreColumnIJ_SeqSELL_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) { 58d4002b98SHong Zhang PetscFunctionBegin; 59d4002b98SHong Zhang 60d4002b98SHong Zhang if (!ia) PetscFunctionReturn(0); 619566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 629566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 639566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 64d4002b98SHong Zhang PetscFunctionReturn(0); 65d4002b98SHong Zhang } 66