xref: /petsc/src/mat/impls/preallocator/matpreallocator.c (revision c09129f1575ca10e91085867db66f4d9c9ac2b6c)
1c094ef40SMatthew G. Knepley #include <petsc/private/matimpl.h>      /*I "petscmat.h" I*/
2e8f14785SLisandro Dalcin #include <petsc/private/hashsetij.h>
3c094ef40SMatthew G. Knepley 
4c094ef40SMatthew G. Knepley typedef struct {
5e8f14785SLisandro Dalcin   PetscHSetIJ ht;
6c094ef40SMatthew G. Knepley   PetscInt   *dnz, *onz;
7*c09129f1SStefano Zampini   PetscInt   *dnzu, *onzu;
8c094ef40SMatthew G. Knepley } Mat_Preallocator;
9c094ef40SMatthew G. Knepley 
10c094ef40SMatthew G. Knepley PetscErrorCode MatDestroy_Preallocator(Mat A)
11c094ef40SMatthew G. Knepley {
12c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) A->data;
13c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
14c094ef40SMatthew G. Knepley 
15c094ef40SMatthew G. Knepley   PetscFunctionBegin;
16c094ef40SMatthew G. Knepley   ierr = MatStashDestroy_Private(&A->stash);CHKERRQ(ierr);
17e8f14785SLisandro Dalcin   ierr = PetscHSetIJDestroy(&p->ht);CHKERRQ(ierr);
18*c09129f1SStefano Zampini   ierr = PetscFree4(p->dnz, p->onz, p->dnzu, p->onzu);CHKERRQ(ierr);
19c094ef40SMatthew G. Knepley   ierr = PetscFree(A->data);CHKERRQ(ierr);
20c094ef40SMatthew G. Knepley   ierr = PetscObjectChangeTypeName((PetscObject) A, 0);CHKERRQ(ierr);
21c094ef40SMatthew G. Knepley   ierr = PetscObjectComposeFunction((PetscObject) A, "MatPreallocatorPreallocate_C", NULL);CHKERRQ(ierr);
22c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
23c094ef40SMatthew G. Knepley }
24c094ef40SMatthew G. Knepley 
25c094ef40SMatthew G. Knepley PetscErrorCode MatSetUp_Preallocator(Mat A)
26c094ef40SMatthew G. Knepley {
27c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) A->data;
28c094ef40SMatthew G. Knepley   PetscInt          m, bs;
29c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
30c094ef40SMatthew G. Knepley 
31c094ef40SMatthew G. Knepley   PetscFunctionBegin;
32c094ef40SMatthew G. Knepley   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
33c094ef40SMatthew G. Knepley   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
34c094ef40SMatthew G. Knepley   ierr = MatGetLocalSize(A, &m, NULL);CHKERRQ(ierr);
35e8f14785SLisandro Dalcin   ierr = PetscHSetIJCreate(&p->ht);CHKERRQ(ierr);
36c094ef40SMatthew G. Knepley   ierr = MatGetBlockSize(A, &bs);CHKERRQ(ierr);
37c094ef40SMatthew G. Knepley   ierr = MatStashCreate_Private(PetscObjectComm((PetscObject) A), bs, &A->stash);CHKERRQ(ierr);
38*c09129f1SStefano Zampini   ierr = PetscCalloc4(m, &p->dnz, m, &p->onz, m, &p->dnzu, m, &p->onzu);CHKERRQ(ierr);
39c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
40c094ef40SMatthew G. Knepley }
41c094ef40SMatthew G. Knepley 
42c094ef40SMatthew G. Knepley PetscErrorCode MatSetValues_Preallocator(Mat A, PetscInt m, const PetscInt *rows, PetscInt n, const PetscInt *cols, const PetscScalar *values, InsertMode addv)
43c094ef40SMatthew G. Knepley {
44c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) A->data;
45c094ef40SMatthew G. Knepley   PetscInt          rStart, rEnd, r, cStart, cEnd, c;
46c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
47c094ef40SMatthew G. Knepley 
48c094ef40SMatthew G. Knepley   PetscFunctionBegin;
49c094ef40SMatthew G. Knepley   /* TODO: Handle blocksize */
50c094ef40SMatthew G. Knepley   ierr = MatGetOwnershipRange(A, &rStart, &rEnd);CHKERRQ(ierr);
51c094ef40SMatthew G. Knepley   ierr = MatGetOwnershipRangeColumn(A, &cStart, &cEnd);CHKERRQ(ierr);
52c094ef40SMatthew G. Knepley   for (r = 0; r < m; ++r) {
53e8f14785SLisandro Dalcin     PetscHashIJKey key;
54e8f14785SLisandro Dalcin     PetscBool      missing;
55c094ef40SMatthew G. Knepley 
56e8f14785SLisandro Dalcin     key.i = rows[r];
57e8f14785SLisandro Dalcin     if (key.i < 0) continue;
58e8f14785SLisandro Dalcin     if ((key.i < rStart) || (key.i >= rEnd)) {
59e8f14785SLisandro Dalcin       ierr = MatStashValuesRow_Private(&A->stash, key.i, n, cols, values, PETSC_FALSE);CHKERRQ(ierr);
60c094ef40SMatthew G. Knepley     } else {
61c094ef40SMatthew G. Knepley       for (c = 0; c < n; ++c) {
62e8f14785SLisandro Dalcin         key.j = cols[c];
63e8f14785SLisandro Dalcin         if (key.j < 0) continue;
64e8f14785SLisandro Dalcin         ierr = PetscHSetIJQueryAdd(p->ht, key, &missing);CHKERRQ(ierr);
65c094ef40SMatthew G. Knepley         if (missing) {
66*c09129f1SStefano Zampini           if ((key.j >= cStart) && (key.j < cEnd)) {
67*c09129f1SStefano Zampini             ++p->dnz[key.i-rStart];
68*c09129f1SStefano Zampini             if (key.j >= key.i) ++p->dnzu[key.i-rStart];
69*c09129f1SStefano Zampini           } else {
70*c09129f1SStefano Zampini             ++p->onz[key.i-rStart];
71*c09129f1SStefano Zampini             if (key.j >= key.i) ++p->onzu[key.i-rStart];
72*c09129f1SStefano Zampini           }
73c094ef40SMatthew G. Knepley         }
74c094ef40SMatthew G. Knepley       }
75c094ef40SMatthew G. Knepley     }
76c094ef40SMatthew G. Knepley   }
77c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
78c094ef40SMatthew G. Knepley }
79c094ef40SMatthew G. Knepley 
80c094ef40SMatthew G. Knepley PetscErrorCode MatAssemblyBegin_Preallocator(Mat A, MatAssemblyType type)
81c094ef40SMatthew G. Knepley {
82c094ef40SMatthew G. Knepley   PetscInt       nstash, reallocs;
83c094ef40SMatthew G. Knepley   PetscErrorCode ierr;
84c094ef40SMatthew G. Knepley 
85c094ef40SMatthew G. Knepley   PetscFunctionBegin;
86c094ef40SMatthew G. Knepley   ierr = MatStashScatterBegin_Private(A, &A->stash, A->rmap->range);CHKERRQ(ierr);
87c094ef40SMatthew G. Knepley   ierr = MatStashGetInfo_Private(&A->stash, &nstash, &reallocs);CHKERRQ(ierr);
88c094ef40SMatthew G. Knepley   ierr = PetscInfo2(A, "Stash has %D entries, uses %D mallocs.\n", nstash, reallocs);CHKERRQ(ierr);
89c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
90c094ef40SMatthew G. Knepley }
91c094ef40SMatthew G. Knepley 
92c094ef40SMatthew G. Knepley PetscErrorCode MatAssemblyEnd_Preallocator(Mat A, MatAssemblyType type)
93c094ef40SMatthew G. Knepley {
94c094ef40SMatthew G. Knepley   PetscScalar   *val;
95c094ef40SMatthew G. Knepley   PetscInt      *row, *col;
96c094ef40SMatthew G. Knepley   PetscInt       i, j, rstart, ncols, flg;
97c094ef40SMatthew G. Knepley   PetscMPIInt    n;
98c094ef40SMatthew G. Knepley   PetscErrorCode ierr;
99c094ef40SMatthew G. Knepley 
100c094ef40SMatthew G. Knepley   PetscFunctionBegin;
101c094ef40SMatthew G. Knepley   while (1) {
102c094ef40SMatthew G. Knepley     ierr = MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg);CHKERRQ(ierr);
103c094ef40SMatthew G. Knepley     if (!flg) break;
104c094ef40SMatthew G. Knepley 
105c094ef40SMatthew G. Knepley     for (i = 0; i < n; ) {
106c094ef40SMatthew G. Knepley       /* Now identify the consecutive vals belonging to the same row */
107c094ef40SMatthew G. Knepley       for (j = i, rstart = row[j]; j < n; j++) {
108c094ef40SMatthew G. Knepley         if (row[j] != rstart) break;
109c094ef40SMatthew G. Knepley       }
110c094ef40SMatthew G. Knepley       if (j < n) ncols = j-i;
111c094ef40SMatthew G. Knepley       else       ncols = n-i;
112c094ef40SMatthew G. Knepley       /* Now assemble all these values with a single function call */
113c094ef40SMatthew G. Knepley       ierr = MatSetValues_Preallocator(A, 1, row+i, ncols, col+i, val+i, INSERT_VALUES);CHKERRQ(ierr);
114c094ef40SMatthew G. Knepley       i = j;
115c094ef40SMatthew G. Knepley     }
116c094ef40SMatthew G. Knepley   }
117c094ef40SMatthew G. Knepley   ierr = MatStashScatterEnd_Private(&A->stash);CHKERRQ(ierr);
118c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
119c094ef40SMatthew G. Knepley }
120c094ef40SMatthew G. Knepley 
121c094ef40SMatthew G. Knepley PetscErrorCode MatView_Preallocator(Mat A, PetscViewer viewer)
122c094ef40SMatthew G. Knepley {
123c094ef40SMatthew G. Knepley   PetscFunctionBegin;
124c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
125c094ef40SMatthew G. Knepley }
126c094ef40SMatthew G. Knepley 
127c094ef40SMatthew G. Knepley PetscErrorCode MatSetOption_Preallocator(Mat A, MatOption op, PetscBool flg)
128c094ef40SMatthew G. Knepley {
129c094ef40SMatthew G. Knepley   PetscFunctionBegin;
130c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
131c094ef40SMatthew G. Knepley }
132c094ef40SMatthew G. Knepley 
133c094ef40SMatthew G. Knepley PetscErrorCode MatPreallocatorPreallocate_Preallocator(Mat mat, PetscBool fill, Mat A)
134c094ef40SMatthew G. Knepley {
135c094ef40SMatthew G. Knepley   Mat_Preallocator *p = (Mat_Preallocator *) mat->data;
136c094ef40SMatthew G. Knepley   PetscInt          bs;
137c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
138c094ef40SMatthew G. Knepley 
139c094ef40SMatthew G. Knepley   PetscFunctionBegin;
140c094ef40SMatthew G. Knepley   ierr = MatGetBlockSize(mat, &bs);CHKERRQ(ierr);
141*c09129f1SStefano Zampini   ierr = MatXAIJSetPreallocation(A, bs, p->dnz, p->onz, p->dnzu, p->onzu);CHKERRQ(ierr);
142c094ef40SMatthew G. Knepley   ierr = MatSetOption(A, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);CHKERRQ(ierr);
143c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
144c094ef40SMatthew G. Knepley }
145c094ef40SMatthew G. Knepley 
146c094ef40SMatthew G. Knepley /*@
147c094ef40SMatthew G. Knepley   MatPreallocatorPreallocate - Preallocates the input matrix, optionally filling it with zeros
148c094ef40SMatthew G. Knepley 
149c094ef40SMatthew G. Knepley   Input Parameter:
150c094ef40SMatthew G. Knepley + mat  - the preallocator
151c094ef40SMatthew G. Knepley - fill - fill the matrix with zeros
152c094ef40SMatthew G. Knepley 
153c094ef40SMatthew G. Knepley   Output Parameter:
154c094ef40SMatthew G. Knepley . A    - the matrix
155c094ef40SMatthew G. Knepley 
156c094ef40SMatthew G. Knepley   Level: advanced
157c094ef40SMatthew G. Knepley 
158c094ef40SMatthew G. Knepley .seealso: MATPREALLOCATOR
159c094ef40SMatthew G. Knepley @*/
160c094ef40SMatthew G. Knepley PetscErrorCode MatPreallocatorPreallocate(Mat mat, PetscBool fill, Mat A)
161c094ef40SMatthew G. Knepley {
162c094ef40SMatthew G. Knepley   PetscErrorCode ierr;
163c094ef40SMatthew G. Knepley 
164c094ef40SMatthew G. Knepley   PetscFunctionBegin;
165c094ef40SMatthew G. Knepley   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
166c094ef40SMatthew G. Knepley   PetscValidHeaderSpecific(A,   MAT_CLASSID, 3);
167c094ef40SMatthew G. Knepley   ierr = PetscUseMethod(mat, "MatPreallocatorPreallocate_C", (Mat,PetscBool,Mat),(mat,fill,A));CHKERRQ(ierr);
168c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
169c094ef40SMatthew G. Knepley }
170c094ef40SMatthew G. Knepley 
/*MC
   MATPREALLOCATOR - MATPREALLOCATOR = "preallocator" - A matrix type to be used for computing a matrix preallocation.

   Operations Provided:
.  MatSetValues()

   Options Database Keys:
. -mat_type preallocator - sets the matrix type to "preallocator" during a call to MatSetFromOptions()

   Level: advanced

.seealso: Mat, MatPreallocatorPreallocate()

M*/
185c094ef40SMatthew G. Knepley 
186c094ef40SMatthew G. Knepley PETSC_EXTERN PetscErrorCode MatCreate_Preallocator(Mat A)
187c094ef40SMatthew G. Knepley {
188c094ef40SMatthew G. Knepley   Mat_Preallocator *p;
189c094ef40SMatthew G. Knepley   PetscErrorCode    ierr;
190c094ef40SMatthew G. Knepley 
191c094ef40SMatthew G. Knepley   PetscFunctionBegin;
192c094ef40SMatthew G. Knepley   ierr = PetscNewLog(A, &p);CHKERRQ(ierr);
193c094ef40SMatthew G. Knepley   A->data = (void *) p;
194c094ef40SMatthew G. Knepley 
195c094ef40SMatthew G. Knepley   p->ht   = NULL;
196c094ef40SMatthew G. Knepley   p->dnz  = NULL;
197c094ef40SMatthew G. Knepley   p->onz  = NULL;
198*c09129f1SStefano Zampini   p->dnzu = NULL;
199*c09129f1SStefano Zampini   p->onzu = NULL;
200c094ef40SMatthew G. Knepley 
201c094ef40SMatthew G. Knepley   /* matrix ops */
202c094ef40SMatthew G. Knepley   ierr = PetscMemzero(A->ops, sizeof(struct _MatOps));CHKERRQ(ierr);
203*c09129f1SStefano Zampini 
204c094ef40SMatthew G. Knepley   A->ops->destroy       = MatDestroy_Preallocator;
205c094ef40SMatthew G. Knepley   A->ops->setup         = MatSetUp_Preallocator;
206c094ef40SMatthew G. Knepley   A->ops->setvalues     = MatSetValues_Preallocator;
207c094ef40SMatthew G. Knepley   A->ops->assemblybegin = MatAssemblyBegin_Preallocator;
208c094ef40SMatthew G. Knepley   A->ops->assemblyend   = MatAssemblyEnd_Preallocator;
209c094ef40SMatthew G. Knepley   A->ops->view          = MatView_Preallocator;
210c094ef40SMatthew G. Knepley   A->ops->setoption     = MatSetOption_Preallocator;
211c094ef40SMatthew G. Knepley 
212c094ef40SMatthew G. Knepley   /* special MATPREALLOCATOR functions */
213c094ef40SMatthew G. Knepley   ierr = PetscObjectComposeFunction((PetscObject) A, "MatPreallocatorPreallocate_C", MatPreallocatorPreallocate_Preallocator);CHKERRQ(ierr);
214c094ef40SMatthew G. Knepley   ierr = PetscObjectChangeTypeName((PetscObject) A, MATPREALLOCATOR);CHKERRQ(ierr);
215c094ef40SMatthew G. Knepley   PetscFunctionReturn(0);
216c094ef40SMatthew G. Knepley }
217