xref: /petsc/src/mat/impls/preallocator/matpreallocator.c (revision 5dca110499e32689380d6e7596456fdb2c00edd9)
1c094ef40SMatthew G. Knepley #include <petsc/private/matimpl.h>      /*I "petscmat.h" I*/
2e8f14785SLisandro Dalcin #include <petsc/private/hashsetij.h>
3c094ef40SMatthew G. Knepley 
4c094ef40SMatthew G. Knepley typedef struct {
5e8f14785SLisandro Dalcin   PetscHSetIJ ht;
6c094ef40SMatthew G. Knepley   PetscInt   *dnz, *onz;
7c09129f1SStefano Zampini   PetscInt   *dnzu, *onzu;
8c094ef40SMatthew G. Knepley } Mat_Preallocator;
9c094ef40SMatthew G. Knepley 
10c094ef40SMatthew G. Knepley PetscErrorCode MatDestroy_Preallocator(Mat A)
11c094ef40SMatthew G. Knepley {
12c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) A->data;
13c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
14c094ef40SMatthew G. Knepley 
15c094ef40SMatthew G. Knepley   PetscFunctionBegin;
16c094ef40SMatthew G. Knepley   ierr = MatStashDestroy_Private(&A->stash);CHKERRQ(ierr);
17e8f14785SLisandro Dalcin   ierr = PetscHSetIJDestroy(&p->ht);CHKERRQ(ierr);
18c09129f1SStefano Zampini   ierr = PetscFree4(p->dnz, p->onz, p->dnzu, p->onzu);CHKERRQ(ierr);
19c094ef40SMatthew G. Knepley   ierr = PetscFree(A->data);CHKERRQ(ierr);
20c094ef40SMatthew G. Knepley   ierr = PetscObjectChangeTypeName((PetscObject) A, 0);CHKERRQ(ierr);
21c094ef40SMatthew G. Knepley   ierr = PetscObjectComposeFunction((PetscObject) A, "MatPreallocatorPreallocate_C", NULL);CHKERRQ(ierr);
22c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
23c094ef40SMatthew G. Knepley }
24c094ef40SMatthew G. Knepley 
25c094ef40SMatthew G. Knepley PetscErrorCode MatSetUp_Preallocator(Mat A)
26c094ef40SMatthew G. Knepley {
27c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) A->data;
28*5dca1104SStefano Zampini   PetscInt          m, bs, mbs;
29c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
30c094ef40SMatthew G. Knepley 
31c094ef40SMatthew G. Knepley   PetscFunctionBegin;
32c094ef40SMatthew G. Knepley   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
33c094ef40SMatthew G. Knepley   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
34c094ef40SMatthew G. Knepley   ierr = MatGetLocalSize(A, &m, NULL);CHKERRQ(ierr);
35e8f14785SLisandro Dalcin   ierr = PetscHSetIJCreate(&p->ht);CHKERRQ(ierr);
36c094ef40SMatthew G. Knepley   ierr = MatGetBlockSize(A, &bs);CHKERRQ(ierr);
37c094ef40SMatthew G. Knepley   ierr = MatStashCreate_Private(PetscObjectComm((PetscObject) A), bs, &A->stash);CHKERRQ(ierr);
38*5dca1104SStefano Zampini   /* arrays are for blocked rows/cols */
39*5dca1104SStefano Zampini   mbs  = m/bs;
40*5dca1104SStefano Zampini   ierr = PetscCalloc4(mbs, &p->dnz, mbs, &p->onz, mbs, &p->dnzu, mbs, &p->onzu);CHKERRQ(ierr);
41c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
42c094ef40SMatthew G. Knepley }
43c094ef40SMatthew G. Knepley 
44c094ef40SMatthew G. Knepley PetscErrorCode MatSetValues_Preallocator(Mat A, PetscInt m, const PetscInt *rows, PetscInt n, const PetscInt *cols, const PetscScalar *values, InsertMode addv)
45c094ef40SMatthew G. Knepley {
46c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) A->data;
47*5dca1104SStefano Zampini   PetscInt          rStart, rEnd, r, cStart, cEnd, c, bs;
48c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
49c094ef40SMatthew G. Knepley 
50c094ef40SMatthew G. Knepley   PetscFunctionBegin;
51*5dca1104SStefano Zampini   ierr = MatGetBlockSize(A, &bs);CHKERRQ(ierr);
52c094ef40SMatthew G. Knepley   ierr = MatGetOwnershipRange(A, &rStart, &rEnd);CHKERRQ(ierr);
53c094ef40SMatthew G. Knepley   ierr = MatGetOwnershipRangeColumn(A, &cStart, &cEnd);CHKERRQ(ierr);
54c094ef40SMatthew G. Knepley   for (r = 0; r < m; ++r) {
55e8f14785SLisandro Dalcin     PetscHashIJKey key;
56e8f14785SLisandro Dalcin     PetscBool      missing;
57c094ef40SMatthew G. Knepley 
58e8f14785SLisandro Dalcin     key.i = rows[r];
59e8f14785SLisandro Dalcin     if (key.i < 0) continue;
60e8f14785SLisandro Dalcin     if ((key.i < rStart) || (key.i >= rEnd)) {
61e8f14785SLisandro Dalcin       ierr = MatStashValuesRow_Private(&A->stash, key.i, n, cols, values, PETSC_FALSE);CHKERRQ(ierr);
62*5dca1104SStefano Zampini     } else { /* Hash table is for blocked rows/cols */
63*5dca1104SStefano Zampini       key.i = rows[r]/bs;
64c094ef40SMatthew G. Knepley       for (c = 0; c < n; ++c) {
65*5dca1104SStefano Zampini         key.j = cols[c]/bs;
66e8f14785SLisandro Dalcin         if (key.j < 0) continue;
67e8f14785SLisandro Dalcin         ierr = PetscHSetIJQueryAdd(p->ht, key, &missing);CHKERRQ(ierr);
68c094ef40SMatthew G. Knepley         if (missing) {
69*5dca1104SStefano Zampini           if ((key.j >= cStart/bs) && (key.j < cEnd/bs)) {
70*5dca1104SStefano Zampini             ++p->dnz[key.i-rStart/bs];
71*5dca1104SStefano Zampini             if (key.j >= key.i) ++p->dnzu[key.i-rStart/bs];
72c09129f1SStefano Zampini           } else {
73*5dca1104SStefano Zampini             ++p->onz[key.i-rStart/bs];
74*5dca1104SStefano Zampini             if (key.j >= key.i) ++p->onzu[key.i-rStart/bs];
75c09129f1SStefano Zampini           }
76c094ef40SMatthew G. Knepley         }
77c094ef40SMatthew G. Knepley       }
78c094ef40SMatthew G. Knepley     }
79c094ef40SMatthew G. Knepley   }
80c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
81c094ef40SMatthew G. Knepley }
82c094ef40SMatthew G. Knepley 
83c094ef40SMatthew G. Knepley PetscErrorCode MatAssemblyBegin_Preallocator(Mat A, MatAssemblyType type)
84c094ef40SMatthew G. Knepley {
85c094ef40SMatthew G. Knepley   PetscInt       nstash, reallocs;
86c094ef40SMatthew G. Knepley   PetscErrorCode ierr;
87c094ef40SMatthew G. Knepley 
88c094ef40SMatthew G. Knepley   PetscFunctionBegin;
89c094ef40SMatthew G. Knepley   ierr = MatStashScatterBegin_Private(A, &A->stash, A->rmap->range);CHKERRQ(ierr);
90c094ef40SMatthew G. Knepley   ierr = MatStashGetInfo_Private(&A->stash, &nstash, &reallocs);CHKERRQ(ierr);
91c094ef40SMatthew G. Knepley   ierr = PetscInfo2(A, "Stash has %D entries, uses %D mallocs.\n", nstash, reallocs);CHKERRQ(ierr);
92c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
93c094ef40SMatthew G. Knepley }
94c094ef40SMatthew G. Knepley 
95c094ef40SMatthew G. Knepley PetscErrorCode MatAssemblyEnd_Preallocator(Mat A, MatAssemblyType type)
96c094ef40SMatthew G. Knepley {
97c094ef40SMatthew G. Knepley   PetscScalar   *val;
98c094ef40SMatthew G. Knepley   PetscInt      *row, *col;
99c094ef40SMatthew G. Knepley   PetscInt       i, j, rstart, ncols, flg;
100c094ef40SMatthew G. Knepley   PetscMPIInt    n;
101c094ef40SMatthew G. Knepley   PetscErrorCode ierr;
102c094ef40SMatthew G. Knepley 
103c094ef40SMatthew G. Knepley   PetscFunctionBegin;
104c094ef40SMatthew G. Knepley   while (1) {
105c094ef40SMatthew G. Knepley     ierr = MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg);CHKERRQ(ierr);
106c094ef40SMatthew G. Knepley     if (!flg) break;
107c094ef40SMatthew G. Knepley 
108c094ef40SMatthew G. Knepley     for (i = 0; i < n; ) {
109c094ef40SMatthew G. Knepley       /* Now identify the consecutive vals belonging to the same row */
110c094ef40SMatthew G. Knepley       for (j = i, rstart = row[j]; j < n; j++) {
111c094ef40SMatthew G. Knepley         if (row[j] != rstart) break;
112c094ef40SMatthew G. Knepley       }
113c094ef40SMatthew G. Knepley       if (j < n) ncols = j-i;
114c094ef40SMatthew G. Knepley       else       ncols = n-i;
115c094ef40SMatthew G. Knepley       /* Now assemble all these values with a single function call */
116c094ef40SMatthew G. Knepley       ierr = MatSetValues_Preallocator(A, 1, row+i, ncols, col+i, val+i, INSERT_VALUES);CHKERRQ(ierr);
117c094ef40SMatthew G. Knepley       i = j;
118c094ef40SMatthew G. Knepley     }
119c094ef40SMatthew G. Knepley   }
120c094ef40SMatthew G. Knepley   ierr = MatStashScatterEnd_Private(&A->stash);CHKERRQ(ierr);
121c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
122c094ef40SMatthew G. Knepley }
123c094ef40SMatthew G. Knepley 
124c094ef40SMatthew G. Knepley PetscErrorCode MatView_Preallocator(Mat A, PetscViewer viewer)
125c094ef40SMatthew G. Knepley {
126c094ef40SMatthew G. Knepley   PetscFunctionBegin;
127c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
128c094ef40SMatthew G. Knepley }
129c094ef40SMatthew G. Knepley 
130c094ef40SMatthew G. Knepley PetscErrorCode MatSetOption_Preallocator(Mat A, MatOption op, PetscBool flg)
131c094ef40SMatthew G. Knepley {
132c094ef40SMatthew G. Knepley   PetscFunctionBegin;
133c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
134c094ef40SMatthew G. Knepley }
135c094ef40SMatthew G. Knepley 
136c094ef40SMatthew G. Knepley PetscErrorCode MatPreallocatorPreallocate_Preallocator(Mat mat, PetscBool fill, Mat A)
137c094ef40SMatthew G. Knepley {
138c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) mat->data;
139c094ef40SMatthew G. Knepley   PetscInt          bs;
140c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
141c094ef40SMatthew G. Knepley 
142c094ef40SMatthew G. Knepley   PetscFunctionBegin;
143c094ef40SMatthew G. Knepley   ierr = MatGetBlockSize(mat, &bs);CHKERRQ(ierr);
144c09129f1SStefano Zampini   ierr = MatXAIJSetPreallocation(A, bs, p->dnz, p->onz, p->dnzu, p->onzu);CHKERRQ(ierr);
145c094ef40SMatthew G. Knepley   ierr = MatSetOption(A, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);CHKERRQ(ierr);
146c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
147c094ef40SMatthew G. Knepley }
148c094ef40SMatthew G. Knepley 
149c094ef40SMatthew G. Knepley /*@
150c094ef40SMatthew G. Knepley   MatPreallocatorPreallocate - Preallocates the input matrix, optionally filling it with zeros
151c094ef40SMatthew G. Knepley 
152c094ef40SMatthew G. Knepley   Input Parameter:
153c094ef40SMatthew G. Knepley + mat  - the preallocator
154c094ef40SMatthew G. Knepley - fill - fill the matrix with zeros
155c094ef40SMatthew G. Knepley 
156c094ef40SMatthew G. Knepley   Output Parameter:
157c094ef40SMatthew G. Knepley . A    - the matrix
158c094ef40SMatthew G. Knepley 
159c094ef40SMatthew G. Knepley   Level: advanced
160c094ef40SMatthew G. Knepley 
161c094ef40SMatthew G. Knepley .seealso: MATPREALLOCATOR
162c094ef40SMatthew G. Knepley @*/
163c094ef40SMatthew G. Knepley PetscErrorCode MatPreallocatorPreallocate(Mat mat, PetscBool fill, Mat A)
164c094ef40SMatthew G. Knepley {
165c094ef40SMatthew G. Knepley   PetscErrorCode ierr;
166c094ef40SMatthew G. Knepley 
167c094ef40SMatthew G. Knepley   PetscFunctionBegin;
168c094ef40SMatthew G. Knepley   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
169c094ef40SMatthew G. Knepley   PetscValidHeaderSpecific(A,   MAT_CLASSID, 3);
170c094ef40SMatthew G. Knepley   ierr = PetscUseMethod(mat, "MatPreallocatorPreallocate_C", (Mat,PetscBool,Mat),(mat,fill,A));CHKERRQ(ierr);
171c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
172c094ef40SMatthew G. Knepley }
173c094ef40SMatthew G. Knepley 
174c094ef40SMatthew G. Knepley /*MC
175c094ef40SMatthew G. Knepley    MATPREALLOCATOR - MATPREALLOCATOR = "preallocator" - A matrix type to be used for computing a matrix preallocation.
176c094ef40SMatthew G. Knepley 
177c094ef40SMatthew G. Knepley    Operations Provided:
178c094ef40SMatthew G. Knepley .  MatSetValues()
179c094ef40SMatthew G. Knepley 
180c094ef40SMatthew G. Knepley    Options Database Keys:
181c094ef40SMatthew G. Knepley . -mat_type preallocator - sets the matrix type to "preallocator" during a call to MatSetFromOptions()
182c094ef40SMatthew G. Knepley 
183c094ef40SMatthew G. Knepley   Level: advanced
184c094ef40SMatthew G. Knepley 
185c094ef40SMatthew G. Knepley .seealso: Mat
186c094ef40SMatthew G. Knepley 
187c094ef40SMatthew G. Knepley M*/
188c094ef40SMatthew G. Knepley 
189c094ef40SMatthew G. Knepley PETSC_EXTERN PetscErrorCode MatCreate_Preallocator(Mat A)
190c094ef40SMatthew G. Knepley {
191c094ef40SMatthew G. Knepley   Mat_Preallocator *p;
192c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
193c094ef40SMatthew G. Knepley 
194c094ef40SMatthew G. Knepley   PetscFunctionBegin;
195c094ef40SMatthew G. Knepley   ierr = PetscNewLog(A, &p);CHKERRQ(ierr);
196c094ef40SMatthew G. Knepley   A->data = (void *) p;
197c094ef40SMatthew G. Knepley 
198c094ef40SMatthew G. Knepley   p->ht   = NULL;
199c094ef40SMatthew G. Knepley   p->dnz  = NULL;
200c094ef40SMatthew G. Knepley   p->onz  = NULL;
201c09129f1SStefano Zampini   p->dnzu = NULL;
202c09129f1SStefano Zampini   p->onzu = NULL;
203c094ef40SMatthew G. Knepley 
204c094ef40SMatthew G. Knepley   /* matrix ops */
205c094ef40SMatthew G. Knepley   ierr = PetscMemzero(A->ops, sizeof(struct _MatOps));CHKERRQ(ierr);
206c09129f1SStefano Zampini 
207c094ef40SMatthew G. Knepley   A->ops->destroy       = MatDestroy_Preallocator;
208c094ef40SMatthew G. Knepley   A->ops->setup         = MatSetUp_Preallocator;
209c094ef40SMatthew G. Knepley   A->ops->setvalues     = MatSetValues_Preallocator;
210c094ef40SMatthew G. Knepley   A->ops->assemblybegin = MatAssemblyBegin_Preallocator;
211c094ef40SMatthew G. Knepley   A->ops->assemblyend   = MatAssemblyEnd_Preallocator;
212c094ef40SMatthew G. Knepley   A->ops->view          = MatView_Preallocator;
213c094ef40SMatthew G. Knepley   A->ops->setoption     = MatSetOption_Preallocator;
214*5dca1104SStefano Zampini   A->ops->setblocksizes = MatSetBlockSizes_Default; /* once set, user is not allowed to change the block sizes */
215c094ef40SMatthew G. Knepley 
216c094ef40SMatthew G. Knepley   /* special MATPREALLOCATOR functions */
217c094ef40SMatthew G. Knepley   ierr = PetscObjectComposeFunction((PetscObject) A, "MatPreallocatorPreallocate_C", MatPreallocatorPreallocate_Preallocator);CHKERRQ(ierr);
218c094ef40SMatthew G. Knepley   ierr = PetscObjectChangeTypeName((PetscObject) A, MATPREALLOCATOR);CHKERRQ(ierr);
219c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
220c094ef40SMatthew G. Knepley }
221