1cb1e1211SMatthew G Knepley #include <petsc-private/dmpleximpl.h> /*I "petscdmplex.h" I*/ 2cb1e1211SMatthew G Knepley 3a0845e3aSMatthew G. Knepley #include <petscfe.h> 4a0845e3aSMatthew G. Knepley 5cb1e1211SMatthew G Knepley #undef __FUNCT__ 6cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexGetScale" 7cb1e1211SMatthew G Knepley PetscErrorCode DMPlexGetScale(DM dm, PetscUnit unit, PetscReal *scale) 8cb1e1211SMatthew G Knepley { 9cb1e1211SMatthew G Knepley DM_Plex *mesh = (DM_Plex*) dm->data; 10cb1e1211SMatthew G Knepley 11cb1e1211SMatthew G Knepley PetscFunctionBegin; 12cb1e1211SMatthew G Knepley PetscValidHeaderSpecific(dm, DM_CLASSID, 1); 13cb1e1211SMatthew G Knepley PetscValidPointer(scale, 3); 14cb1e1211SMatthew G Knepley *scale = mesh->scale[unit]; 15cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 16cb1e1211SMatthew G Knepley } 17cb1e1211SMatthew G Knepley 18cb1e1211SMatthew G Knepley #undef __FUNCT__ 19cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexSetScale" 20cb1e1211SMatthew G Knepley PetscErrorCode DMPlexSetScale(DM dm, PetscUnit unit, PetscReal scale) 21cb1e1211SMatthew G Knepley { 22cb1e1211SMatthew G Knepley DM_Plex *mesh = (DM_Plex*) dm->data; 23cb1e1211SMatthew G Knepley 24cb1e1211SMatthew G Knepley PetscFunctionBegin; 25cb1e1211SMatthew G Knepley PetscValidHeaderSpecific(dm, DM_CLASSID, 1); 26cb1e1211SMatthew G Knepley mesh->scale[unit] = scale; 27cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 28cb1e1211SMatthew G Knepley } 29cb1e1211SMatthew G Knepley 30cb1e1211SMatthew G Knepley PETSC_STATIC_INLINE PetscInt epsilon(PetscInt i, PetscInt j, PetscInt k) 31cb1e1211SMatthew G Knepley { 32cb1e1211SMatthew G Knepley switch (i) { 33cb1e1211SMatthew G Knepley case 0: 34cb1e1211SMatthew G Knepley switch (j) { 35cb1e1211SMatthew G Knepley case 0: return 0; 36cb1e1211SMatthew G Knepley case 1: 37cb1e1211SMatthew G Knepley switch (k) { 38cb1e1211SMatthew G Knepley case 0: return 0; 39cb1e1211SMatthew G Knepley case 1: return 0; 40cb1e1211SMatthew G Knepley case 2: return 1; 41cb1e1211SMatthew G Knepley } 42cb1e1211SMatthew G Knepley case 2: 43cb1e1211SMatthew G Knepley switch (k) { 44cb1e1211SMatthew G Knepley case 0: return 0; 45cb1e1211SMatthew G Knepley case 1: return -1; 46cb1e1211SMatthew G Knepley case 2: return 0; 47cb1e1211SMatthew G Knepley } 48cb1e1211SMatthew G Knepley } 49cb1e1211SMatthew G Knepley case 1: 50cb1e1211SMatthew G Knepley switch (j) { 51cb1e1211SMatthew G Knepley case 0: 52cb1e1211SMatthew G Knepley switch (k) { 53cb1e1211SMatthew G Knepley case 0: return 0; 54cb1e1211SMatthew G Knepley case 1: return 0; 55cb1e1211SMatthew G Knepley case 2: return -1; 56cb1e1211SMatthew G Knepley } 57cb1e1211SMatthew G Knepley case 1: return 0; 58cb1e1211SMatthew G Knepley case 2: 59cb1e1211SMatthew G Knepley switch (k) { 60cb1e1211SMatthew G Knepley case 0: return 1; 61cb1e1211SMatthew G Knepley case 1: return 0; 62cb1e1211SMatthew G Knepley case 2: return 0; 63cb1e1211SMatthew G Knepley } 64cb1e1211SMatthew G Knepley } 65cb1e1211SMatthew G Knepley case 2: 66cb1e1211SMatthew G Knepley switch (j) { 67cb1e1211SMatthew G Knepley case 0: 68cb1e1211SMatthew G Knepley switch (k) { 69cb1e1211SMatthew G Knepley case 0: return 0; 70cb1e1211SMatthew G Knepley case 1: return 1; 71cb1e1211SMatthew G Knepley case 2: return 0; 72cb1e1211SMatthew G Knepley } 73cb1e1211SMatthew G Knepley case 1: 74cb1e1211SMatthew G Knepley switch (k) { 75cb1e1211SMatthew G Knepley case 0: return -1; 76cb1e1211SMatthew G Knepley case 1: return 0; 77cb1e1211SMatthew G Knepley case 2: return 0; 78cb1e1211SMatthew G Knepley } 79cb1e1211SMatthew G Knepley case 2: return 0; 80cb1e1211SMatthew G Knepley } 81cb1e1211SMatthew G Knepley } 82cb1e1211SMatthew G Knepley return 0; 83cb1e1211SMatthew G Knepley } 84cb1e1211SMatthew G Knepley 85cb1e1211SMatthew G Knepley #undef __FUNCT__ 86cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexCreateRigidBody" 87cb1e1211SMatthew G Knepley /*@C 88cb1e1211SMatthew G Knepley DMPlexCreateRigidBody - create rigid body modes from coordinates 89cb1e1211SMatthew G Knepley 90cb1e1211SMatthew G Knepley Collective on DM 91cb1e1211SMatthew G Knepley 92cb1e1211SMatthew G Knepley Input Arguments: 93cb1e1211SMatthew G Knepley + dm - the DM 94cb1e1211SMatthew G Knepley . section - the local section associated with the rigid field, or NULL for the default section 95cb1e1211SMatthew G Knepley - globalSection - the global section associated with the rigid field, or NULL for the default section 96cb1e1211SMatthew G Knepley 97cb1e1211SMatthew G Knepley Output Argument: 98cb1e1211SMatthew G Knepley . sp - the null space 99cb1e1211SMatthew G Knepley 100cb1e1211SMatthew G Knepley Note: This is necessary to take account of Dirichlet conditions on the displacements 101cb1e1211SMatthew G Knepley 102cb1e1211SMatthew G Knepley Level: advanced 103cb1e1211SMatthew G Knepley 104cb1e1211SMatthew G Knepley .seealso: MatNullSpaceCreate() 105cb1e1211SMatthew G Knepley @*/ 106cb1e1211SMatthew G Knepley PetscErrorCode DMPlexCreateRigidBody(DM dm, PetscSection section, PetscSection globalSection, MatNullSpace *sp) 107cb1e1211SMatthew G Knepley { 108cb1e1211SMatthew G Knepley MPI_Comm comm; 109cb1e1211SMatthew G Knepley Vec coordinates, localMode, mode[6]; 110cb1e1211SMatthew G Knepley PetscSection coordSection; 111cb1e1211SMatthew G Knepley PetscScalar *coords; 112cb1e1211SMatthew G Knepley PetscInt dim, vStart, vEnd, v, n, m, d, i, j; 113cb1e1211SMatthew G Knepley PetscErrorCode ierr; 114cb1e1211SMatthew G Knepley 115cb1e1211SMatthew G Knepley PetscFunctionBegin; 116cb1e1211SMatthew G Knepley ierr = PetscObjectGetComm((PetscObject)dm,&comm);CHKERRQ(ierr); 117cb1e1211SMatthew G Knepley ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr); 118cb1e1211SMatthew G Knepley if (dim == 1) { 119cb1e1211SMatthew G Knepley ierr = MatNullSpaceCreate(comm, PETSC_TRUE, 0, NULL, sp);CHKERRQ(ierr); 120cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 121cb1e1211SMatthew G Knepley } 122cb1e1211SMatthew G Knepley if (!section) {ierr = DMGetDefaultSection(dm, §ion);CHKERRQ(ierr);} 123cb1e1211SMatthew G Knepley if (!globalSection) {ierr = DMGetDefaultGlobalSection(dm, &globalSection);CHKERRQ(ierr);} 124cb1e1211SMatthew G Knepley ierr = PetscSectionGetConstrainedStorageSize(globalSection, &n);CHKERRQ(ierr); 125cb1e1211SMatthew G Knepley ierr = DMPlexGetDepthStratum(dm, 0, &vStart, &vEnd);CHKERRQ(ierr); 126cb1e1211SMatthew G Knepley ierr = DMPlexGetCoordinateSection(dm, &coordSection);CHKERRQ(ierr); 127cb1e1211SMatthew G Knepley ierr = DMGetCoordinatesLocal(dm, &coordinates);CHKERRQ(ierr); 128cb1e1211SMatthew G Knepley m = (dim*(dim+1))/2; 129cb1e1211SMatthew G Knepley ierr = VecCreate(comm, &mode[0]);CHKERRQ(ierr); 130cb1e1211SMatthew G Knepley ierr = VecSetSizes(mode[0], n, PETSC_DETERMINE);CHKERRQ(ierr); 131cb1e1211SMatthew G Knepley ierr = VecSetUp(mode[0]);CHKERRQ(ierr); 132cb1e1211SMatthew G Knepley for (i = 1; i < m; ++i) {ierr = VecDuplicate(mode[0], &mode[i]);CHKERRQ(ierr);} 133cb1e1211SMatthew G Knepley /* Assume P1 */ 134cb1e1211SMatthew G Knepley ierr = DMGetLocalVector(dm, &localMode);CHKERRQ(ierr); 135cb1e1211SMatthew G Knepley for (d = 0; d < dim; ++d) { 136cb1e1211SMatthew G Knepley PetscScalar values[3] = {0.0, 0.0, 0.0}; 137cb1e1211SMatthew G Knepley 138cb1e1211SMatthew G Knepley values[d] = 1.0; 139cb1e1211SMatthew G Knepley ierr = VecSet(localMode, 0.0);CHKERRQ(ierr); 140cb1e1211SMatthew G Knepley for (v = vStart; v < vEnd; ++v) { 141cb1e1211SMatthew G Knepley ierr = DMPlexVecSetClosure(dm, section, localMode, v, values, INSERT_VALUES);CHKERRQ(ierr); 142cb1e1211SMatthew G Knepley } 143cb1e1211SMatthew G Knepley ierr = DMLocalToGlobalBegin(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr); 144cb1e1211SMatthew G Knepley ierr = DMLocalToGlobalEnd(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr); 145cb1e1211SMatthew G Knepley } 146cb1e1211SMatthew G Knepley ierr = VecGetArray(coordinates, &coords);CHKERRQ(ierr); 147cb1e1211SMatthew G Knepley for (d = dim; d < dim*(dim+1)/2; ++d) { 148cb1e1211SMatthew G Knepley PetscInt i, j, k = dim > 2 ? d - dim : d; 149cb1e1211SMatthew G Knepley 150cb1e1211SMatthew G Knepley ierr = VecSet(localMode, 0.0);CHKERRQ(ierr); 151cb1e1211SMatthew G Knepley for (v = vStart; v < vEnd; ++v) { 152cb1e1211SMatthew G Knepley PetscScalar values[3] = {0.0, 0.0, 0.0}; 153cb1e1211SMatthew G Knepley PetscInt off; 154cb1e1211SMatthew G Knepley 155cb1e1211SMatthew G Knepley ierr = PetscSectionGetOffset(coordSection, v, &off);CHKERRQ(ierr); 156cb1e1211SMatthew G Knepley for (i = 0; i < dim; ++i) { 157cb1e1211SMatthew G Knepley for (j = 0; j < dim; ++j) { 158cb1e1211SMatthew G Knepley values[j] += epsilon(i, j, k)*PetscRealPart(coords[off+i]); 159cb1e1211SMatthew G Knepley } 160cb1e1211SMatthew G Knepley } 161cb1e1211SMatthew G Knepley ierr = DMPlexVecSetClosure(dm, section, localMode, v, values, INSERT_VALUES);CHKERRQ(ierr); 162cb1e1211SMatthew G Knepley } 163cb1e1211SMatthew G Knepley ierr = DMLocalToGlobalBegin(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr); 164cb1e1211SMatthew G Knepley ierr = DMLocalToGlobalEnd(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr); 165cb1e1211SMatthew G Knepley } 166cb1e1211SMatthew G Knepley ierr = VecRestoreArray(coordinates, &coords);CHKERRQ(ierr); 167cb1e1211SMatthew G Knepley ierr = DMRestoreLocalVector(dm, &localMode);CHKERRQ(ierr); 168cb1e1211SMatthew G Knepley for (i = 0; i < dim; ++i) {ierr = VecNormalize(mode[i], NULL);CHKERRQ(ierr);} 169cb1e1211SMatthew G Knepley /* Orthonormalize system */ 170cb1e1211SMatthew G Knepley for (i = dim; i < m; ++i) { 171cb1e1211SMatthew G Knepley PetscScalar dots[6]; 172cb1e1211SMatthew G Knepley 173cb1e1211SMatthew G Knepley ierr = VecMDot(mode[i], i, mode, dots);CHKERRQ(ierr); 174cb1e1211SMatthew G Knepley for (j = 0; j < i; ++j) dots[j] *= -1.0; 175cb1e1211SMatthew G Knepley ierr = VecMAXPY(mode[i], i, dots, mode);CHKERRQ(ierr); 176cb1e1211SMatthew G Knepley ierr = VecNormalize(mode[i], NULL);CHKERRQ(ierr); 177cb1e1211SMatthew G Knepley } 178cb1e1211SMatthew G Knepley ierr = MatNullSpaceCreate(comm, PETSC_FALSE, m, mode, sp);CHKERRQ(ierr); 179cb1e1211SMatthew G Knepley for (i = 0; i< m; ++i) {ierr = VecDestroy(&mode[i]);CHKERRQ(ierr);} 180cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 181cb1e1211SMatthew G Knepley } 182cb1e1211SMatthew G Knepley 183cb1e1211SMatthew G Knepley #undef __FUNCT__ 184cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexProjectFunctionLocal" 18572f94c41SMatthew G. Knepley PetscErrorCode DMPlexProjectFunctionLocal(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], PetscScalar *), InsertMode mode, Vec localX) 186cb1e1211SMatthew G Knepley { 18772f94c41SMatthew G. Knepley PetscDualSpace *sp; 18872f94c41SMatthew G. Knepley PetscSection section; 18972f94c41SMatthew G. Knepley PetscScalar *values; 19072f94c41SMatthew G. Knepley PetscReal *v0, *J, detJ; 19172f94c41SMatthew G. Knepley PetscInt numFields, numComp, dim, spDim, totDim = 0, numValues, cStart, cEnd, c, f, d, v; 192cb1e1211SMatthew G Knepley PetscErrorCode ierr; 193cb1e1211SMatthew G Knepley 194cb1e1211SMatthew G Knepley PetscFunctionBegin; 195cb1e1211SMatthew G Knepley ierr = DMGetDefaultSection(dm, §ion);CHKERRQ(ierr); 19672f94c41SMatthew G. Knepley ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr); 197785e854fSJed Brown ierr = PetscMalloc1(numFields, &sp);CHKERRQ(ierr); 19872f94c41SMatthew G. Knepley for (f = 0; f < numFields; ++f) { 19972f94c41SMatthew G. Knepley ierr = PetscFEGetDualSpace(fe[f], &sp[f]);CHKERRQ(ierr); 20072f94c41SMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[f], &numComp);CHKERRQ(ierr); 20172f94c41SMatthew G. Knepley ierr = PetscDualSpaceGetDimension(sp[f], &spDim);CHKERRQ(ierr); 20272f94c41SMatthew G. Knepley totDim += spDim*numComp; 203cb1e1211SMatthew G Knepley } 20472f94c41SMatthew G. Knepley ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr); 20572f94c41SMatthew G. Knepley ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr); 20672f94c41SMatthew G. Knepley ierr = DMPlexVecGetClosure(dm, section, localX, cStart, &numValues, NULL);CHKERRQ(ierr); 20772f94c41SMatthew G. Knepley if (numValues != totDim) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "The section cell closure size %d != dual space dimension %d", numValues, totDim); 20872f94c41SMatthew G. Knepley ierr = DMGetWorkArray(dm, numValues, PETSC_SCALAR, &values);CHKERRQ(ierr); 209dcca6d9dSJed Brown ierr = PetscMalloc2(dim,&v0,dim*dim,&J);CHKERRQ(ierr); 21072f94c41SMatthew G. Knepley for (c = cStart; c < cEnd; ++c) { 21172f94c41SMatthew G. Knepley PetscCellGeometry geom; 212cb1e1211SMatthew G Knepley 213cb1e1211SMatthew G Knepley ierr = DMPlexComputeCellGeometry(dm, c, v0, J, NULL, &detJ);CHKERRQ(ierr); 21472f94c41SMatthew G. Knepley geom.v0 = v0; 21572f94c41SMatthew G. Knepley geom.J = J; 21672f94c41SMatthew G. Knepley geom.detJ = &detJ; 21772f94c41SMatthew G. Knepley for (f = 0, v = 0; f < numFields; ++f) { 21872f94c41SMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[f], &numComp);CHKERRQ(ierr); 21972f94c41SMatthew G. Knepley ierr = PetscDualSpaceGetDimension(sp[f], &spDim);CHKERRQ(ierr); 22072f94c41SMatthew G. Knepley for (d = 0; d < spDim; ++d) { 22172f94c41SMatthew G. Knepley ierr = PetscDualSpaceApply(sp[f], d, geom, numComp, funcs[f], &values[v]);CHKERRQ(ierr); 22272f94c41SMatthew G. Knepley v += numComp; 223cb1e1211SMatthew G Knepley } 224cb1e1211SMatthew G Knepley } 22572f94c41SMatthew G. Knepley ierr = DMPlexVecSetClosure(dm, section, localX, c, values, mode);CHKERRQ(ierr); 226cb1e1211SMatthew G Knepley } 22772f94c41SMatthew G. Knepley ierr = DMRestoreWorkArray(dm, numValues, PETSC_SCALAR, &values);CHKERRQ(ierr); 2281f2da991SMatthew G. Knepley ierr = PetscFree2(v0,J);CHKERRQ(ierr); 22972f94c41SMatthew G. Knepley ierr = PetscFree(sp);CHKERRQ(ierr); 230cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 231cb1e1211SMatthew G Knepley } 232cb1e1211SMatthew G Knepley 233cb1e1211SMatthew G Knepley #undef __FUNCT__ 234cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexProjectFunction" 235cb1e1211SMatthew G Knepley /*@C 236cb1e1211SMatthew G Knepley DMPlexProjectFunction - This projects the given function into the function space provided. 237cb1e1211SMatthew G Knepley 238cb1e1211SMatthew G Knepley Input Parameters: 239cb1e1211SMatthew G Knepley + dm - The DM 24072f94c41SMatthew G. Knepley . fe - The PetscFE associated with the field 24172f94c41SMatthew G. Knepley . funcs - The coordinate functions to evaluate, one per field 242cb1e1211SMatthew G Knepley - mode - The insertion mode for values 243cb1e1211SMatthew G Knepley 244cb1e1211SMatthew G Knepley Output Parameter: 245cb1e1211SMatthew G Knepley . X - vector 246cb1e1211SMatthew G Knepley 247cb1e1211SMatthew G Knepley Level: developer 248cb1e1211SMatthew G Knepley 249878cb397SSatish Balay .seealso: DMPlexComputeL2Diff() 250878cb397SSatish Balay @*/ 25172f94c41SMatthew G. Knepley PetscErrorCode DMPlexProjectFunction(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], PetscScalar *), InsertMode mode, Vec X) 252cb1e1211SMatthew G Knepley { 253cb1e1211SMatthew G Knepley Vec localX; 254cb1e1211SMatthew G Knepley PetscErrorCode ierr; 255cb1e1211SMatthew G Knepley 256cb1e1211SMatthew G Knepley PetscFunctionBegin; 257*9a800dd8SMatthew G. Knepley PetscValidHeaderSpecific(dm, DM_CLASSID, 1); 258cb1e1211SMatthew G Knepley ierr = DMGetLocalVector(dm, &localX);CHKERRQ(ierr); 25972f94c41SMatthew G. Knepley ierr = DMPlexProjectFunctionLocal(dm, fe, funcs, mode, localX);CHKERRQ(ierr); 260cb1e1211SMatthew G Knepley ierr = DMLocalToGlobalBegin(dm, localX, mode, X);CHKERRQ(ierr); 261cb1e1211SMatthew G Knepley ierr = DMLocalToGlobalEnd(dm, localX, mode, X);CHKERRQ(ierr); 262cb1e1211SMatthew G Knepley ierr = DMRestoreLocalVector(dm, &localX);CHKERRQ(ierr); 263cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 264cb1e1211SMatthew G Knepley } 265cb1e1211SMatthew G Knepley 266cb1e1211SMatthew G Knepley #undef __FUNCT__ 267cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeL2Diff" 268cb1e1211SMatthew G Knepley /*@C 269cb1e1211SMatthew G Knepley DMPlexComputeL2Diff - This function computes the L_2 difference between a function u and an FEM interpolant solution u_h. 270cb1e1211SMatthew G Knepley 271cb1e1211SMatthew G Knepley Input Parameters: 272cb1e1211SMatthew G Knepley + dm - The DM 273c5bbbd5bSMatthew G. Knepley . fe - The PetscFE object for each field 274cb1e1211SMatthew G Knepley . funcs - The functions to evaluate for each field component 275cb1e1211SMatthew G Knepley - X - The coefficient vector u_h 276cb1e1211SMatthew G Knepley 277cb1e1211SMatthew G Knepley Output Parameter: 278cb1e1211SMatthew G Knepley . diff - The diff ||u - u_h||_2 279cb1e1211SMatthew G Knepley 280cb1e1211SMatthew G Knepley Level: developer 281cb1e1211SMatthew G Knepley 282cb1e1211SMatthew G Knepley .seealso: DMPlexProjectFunction() 283878cb397SSatish Balay @*/ 284c5bbbd5bSMatthew G. Knepley PetscErrorCode DMPlexComputeL2Diff(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], PetscScalar *), Vec X, PetscReal *diff) 285cb1e1211SMatthew G Knepley { 286cb1e1211SMatthew G Knepley const PetscInt debug = 0; 287cb1e1211SMatthew G Knepley PetscSection section; 288c5bbbd5bSMatthew G. Knepley PetscQuadrature quad; 289cb1e1211SMatthew G Knepley Vec localX; 29072f94c41SMatthew G. Knepley PetscScalar *funcVal; 291cb1e1211SMatthew G Knepley PetscReal *coords, *v0, *J, *invJ, detJ; 292cb1e1211SMatthew G Knepley PetscReal localDiff = 0.0; 293cb1e1211SMatthew G Knepley PetscInt dim, numFields, numComponents = 0, cStart, cEnd, c, field, fieldOffset, comp; 294cb1e1211SMatthew G Knepley PetscErrorCode ierr; 295cb1e1211SMatthew G Knepley 296cb1e1211SMatthew G Knepley PetscFunctionBegin; 297cb1e1211SMatthew G Knepley ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr); 298cb1e1211SMatthew G Knepley ierr = DMGetDefaultSection(dm, §ion);CHKERRQ(ierr); 299cb1e1211SMatthew G Knepley ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr); 300cb1e1211SMatthew G Knepley ierr = DMGetLocalVector(dm, &localX);CHKERRQ(ierr); 301cb1e1211SMatthew G Knepley ierr = DMGlobalToLocalBegin(dm, X, INSERT_VALUES, localX);CHKERRQ(ierr); 302cb1e1211SMatthew G Knepley ierr = DMGlobalToLocalEnd(dm, X, INSERT_VALUES, localX);CHKERRQ(ierr); 303cb1e1211SMatthew G Knepley for (field = 0; field < numFields; ++field) { 304c5bbbd5bSMatthew G. Knepley PetscInt Nc; 305c5bbbd5bSMatthew G. Knepley 306c5bbbd5bSMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[field], &Nc);CHKERRQ(ierr); 307c5bbbd5bSMatthew G. Knepley numComponents += Nc; 308cb1e1211SMatthew G Knepley } 30972f94c41SMatthew G. Knepley ierr = DMPlexProjectFunctionLocal(dm, fe, funcs, INSERT_BC_VALUES, localX);CHKERRQ(ierr); 310dcca6d9dSJed Brown ierr = PetscMalloc5(numComponents,&funcVal,dim,&coords,dim,&v0,dim*dim,&J,dim*dim,&invJ);CHKERRQ(ierr); 311cb1e1211SMatthew G Knepley ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr); 312c5bbbd5bSMatthew G. Knepley ierr = PetscFEGetQuadrature(fe[0], &quad);CHKERRQ(ierr); 313cb1e1211SMatthew G Knepley for (c = cStart; c < cEnd; ++c) { 314a1e44745SMatthew G. Knepley PetscScalar *x = NULL; 315cb1e1211SMatthew G Knepley PetscReal elemDiff = 0.0; 316cb1e1211SMatthew G Knepley 317cb1e1211SMatthew G Knepley ierr = DMPlexComputeCellGeometry(dm, c, v0, J, invJ, &detJ);CHKERRQ(ierr); 318cb1e1211SMatthew G Knepley if (detJ <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ, c); 319cb1e1211SMatthew G Knepley ierr = DMPlexVecGetClosure(dm, NULL, localX, c, NULL, &x);CHKERRQ(ierr); 320cb1e1211SMatthew G Knepley 321cb1e1211SMatthew G Knepley for (field = 0, comp = 0, fieldOffset = 0; field < numFields; ++field) { 322f9fd7fdbSMatthew G. Knepley const PetscInt numQuadPoints = quad.numPoints; 323f9fd7fdbSMatthew G. Knepley const PetscReal *quadPoints = quad.points; 324f9fd7fdbSMatthew G. Knepley const PetscReal *quadWeights = quad.weights; 325c5bbbd5bSMatthew G. Knepley PetscReal *basis; 326c5bbbd5bSMatthew G. Knepley PetscInt numBasisFuncs, numBasisComps, q, d, e, fc, f; 327cb1e1211SMatthew G Knepley 328c5bbbd5bSMatthew G. Knepley ierr = PetscFEGetDimension(fe[field], &numBasisFuncs);CHKERRQ(ierr); 329c5bbbd5bSMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[field], &numBasisComps);CHKERRQ(ierr); 330c5bbbd5bSMatthew G. Knepley ierr = PetscFEGetDefaultTabulation(fe[field], &basis, NULL, NULL);CHKERRQ(ierr); 331cb1e1211SMatthew G Knepley if (debug) { 332cb1e1211SMatthew G Knepley char title[1024]; 333cb1e1211SMatthew G Knepley ierr = PetscSNPrintf(title, 1023, "Solution for Field %d", field);CHKERRQ(ierr); 334cb1e1211SMatthew G Knepley ierr = DMPrintCellVector(c, title, numBasisFuncs*numBasisComps, &x[fieldOffset]);CHKERRQ(ierr); 335cb1e1211SMatthew G Knepley } 336cb1e1211SMatthew G Knepley for (q = 0; q < numQuadPoints; ++q) { 337cb1e1211SMatthew G Knepley for (d = 0; d < dim; d++) { 338cb1e1211SMatthew G Knepley coords[d] = v0[d]; 339cb1e1211SMatthew G Knepley for (e = 0; e < dim; e++) { 340cb1e1211SMatthew G Knepley coords[d] += J[d*dim+e]*(quadPoints[q*dim+e] + 1.0); 341cb1e1211SMatthew G Knepley } 342cb1e1211SMatthew G Knepley } 34372f94c41SMatthew G. Knepley (*funcs[field])(coords, funcVal); 344cb1e1211SMatthew G Knepley for (fc = 0; fc < numBasisComps; ++fc) { 345a1d24da5SMatthew G. Knepley PetscScalar interpolant = 0.0; 346a1d24da5SMatthew G. Knepley 347cb1e1211SMatthew G Knepley for (f = 0; f < numBasisFuncs; ++f) { 348cb1e1211SMatthew G Knepley const PetscInt fidx = f*numBasisComps+fc; 349a1d24da5SMatthew G. Knepley interpolant += x[fieldOffset+fidx]*basis[q*numBasisFuncs*numBasisComps+fidx]; 350cb1e1211SMatthew G Knepley } 35172f94c41SMatthew G. Knepley if (debug) {ierr = PetscPrintf(PETSC_COMM_SELF, " elem %d field %d diff %g\n", c, field, PetscSqr(PetscRealPart(interpolant - funcVal[fc]))*quadWeights[q]*detJ);CHKERRQ(ierr);} 35272f94c41SMatthew G. Knepley elemDiff += PetscSqr(PetscRealPart(interpolant - funcVal[fc]))*quadWeights[q]*detJ; 353cb1e1211SMatthew G Knepley } 354cb1e1211SMatthew G Knepley } 355cb1e1211SMatthew G Knepley comp += numBasisComps; 356cb1e1211SMatthew G Knepley fieldOffset += numBasisFuncs*numBasisComps; 357cb1e1211SMatthew G Knepley } 358cb1e1211SMatthew G Knepley ierr = DMPlexVecRestoreClosure(dm, NULL, localX, c, NULL, &x);CHKERRQ(ierr); 359cb1e1211SMatthew G Knepley if (debug) {ierr = PetscPrintf(PETSC_COMM_SELF, " elem %d diff %g\n", c, elemDiff);CHKERRQ(ierr);} 360cb1e1211SMatthew G Knepley localDiff += elemDiff; 361cb1e1211SMatthew G Knepley } 36272f94c41SMatthew G. Knepley ierr = PetscFree5(funcVal,coords,v0,J,invJ);CHKERRQ(ierr); 363cb1e1211SMatthew G Knepley ierr = DMRestoreLocalVector(dm, &localX);CHKERRQ(ierr); 36486a74ee0SMatthew G. Knepley ierr = MPI_Allreduce(&localDiff, diff, 1, MPIU_REAL, MPI_SUM, PetscObjectComm((PetscObject)dm));CHKERRQ(ierr); 365cb1e1211SMatthew G Knepley *diff = PetscSqrtReal(*diff); 366cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 367cb1e1211SMatthew G Knepley } 368cb1e1211SMatthew G Knepley 369a0845e3aSMatthew G. Knepley #if 0 370a0845e3aSMatthew G. Knepley 371cb1e1211SMatthew G Knepley #undef __FUNCT__ 372cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeResidualFEM" 373cb1e1211SMatthew G Knepley PetscErrorCode DMPlexComputeResidualFEM(DM dm, Vec X, Vec F, void *user) 374cb1e1211SMatthew G Knepley { 375cb1e1211SMatthew G Knepley DM_Plex *mesh = (DM_Plex *) dm->data; 3769a559087SMatthew G. Knepley PetscFEM *fem = (PetscFEM *) user; 377cb1e1211SMatthew G Knepley PetscQuadrature *quad = fem->quad; 378652b88e8SMatthew G. Knepley PetscQuadrature *quadBd = fem->quadBd; 379cb1e1211SMatthew G Knepley PetscSection section; 38002a80efeSMatthew G. Knepley PetscReal *v0, *n, *J, *invJ, *detJ; 381cb1e1211SMatthew G Knepley PetscScalar *elemVec, *u; 382cb1e1211SMatthew G Knepley PetscInt dim, numFields, field, numBatchesTmp = 1, numCells, cStart, cEnd, c; 383652b88e8SMatthew G. Knepley PetscInt cellDof, numComponents; 384652b88e8SMatthew G. Knepley PetscBool has; 385cb1e1211SMatthew G Knepley PetscErrorCode ierr; 386cb1e1211SMatthew G Knepley 387cb1e1211SMatthew G Knepley PetscFunctionBegin; 388652b88e8SMatthew G. Knepley if (has && quadBd) { 389652b88e8SMatthew G. Knepley DMLabel label; 390652b88e8SMatthew G. Knepley IS pointIS; 391652b88e8SMatthew G. Knepley const PetscInt *points; 392652b88e8SMatthew G. Knepley PetscInt numPoints, p; 393652b88e8SMatthew G. Knepley 394652b88e8SMatthew G. Knepley ierr = DMPlexGetLabel(dm, "boundary", &label);CHKERRQ(ierr); 395652b88e8SMatthew G. Knepley ierr = DMLabelGetStratumSize(label, 1, &numPoints);CHKERRQ(ierr); 396652b88e8SMatthew G. Knepley ierr = DMLabelGetStratumIS(label, 1, &pointIS);CHKERRQ(ierr); 397652b88e8SMatthew G. Knepley ierr = ISGetIndices(pointIS, &points);CHKERRQ(ierr); 398652b88e8SMatthew G. Knepley for (field = 0, cellDof = 0, numComponents = 0; field < numFields; ++field) { 399652b88e8SMatthew G. Knepley cellDof += quadBd[field].numBasisFuncs*quadBd[field].numComponents; 400652b88e8SMatthew G. Knepley numComponents += quadBd[field].numComponents; 401652b88e8SMatthew G. Knepley } 402dcca6d9dSJed Brown ierr = PetscMalloc7(numPoints*cellDof,&u,numPoints*dim,&v0,numPoints*dim,&n,numPoints*dim*dim,&J,numPoints*dim*dim,&invJ,numPoints,&detJ,numPoints*cellDof,&elemVec);CHKERRQ(ierr); 403652b88e8SMatthew G. Knepley for (p = 0; p < numPoints; ++p) { 404652b88e8SMatthew G. Knepley const PetscInt point = points[p]; 405652b88e8SMatthew G. Knepley PetscScalar *x; 406652b88e8SMatthew G. Knepley PetscInt i; 407652b88e8SMatthew G. Knepley 40802a80efeSMatthew G. Knepley /* TODO: Add normal determination here */ 409652b88e8SMatthew G. Knepley ierr = DMPlexComputeCellGeometry(dm, point, &v0[p*dim], &J[p*dim*dim], &invJ[p*dim*dim], &detJ[p]);CHKERRQ(ierr); 4101d930511SMatthew G. Knepley if (detJ[p] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for face %d", detJ[p], point); 411652b88e8SMatthew G. Knepley ierr = DMPlexVecGetClosure(dm, NULL, X, point, NULL, &x);CHKERRQ(ierr); 412652b88e8SMatthew G. Knepley 413652b88e8SMatthew G. Knepley for (i = 0; i < cellDof; ++i) u[p*cellDof+i] = x[i]; 414652b88e8SMatthew G. Knepley ierr = DMPlexVecRestoreClosure(dm, NULL, X, point, NULL, &x);CHKERRQ(ierr); 415652b88e8SMatthew G. Knepley } 416652b88e8SMatthew G. Knepley for (field = 0; field < numFields; ++field) { 417652b88e8SMatthew G. Knepley const PetscInt numQuadPoints = quadBd[field].numQuadPoints; 418652b88e8SMatthew G. Knepley const PetscInt numBasisFuncs = quadBd[field].numBasisFuncs; 419a9dc2124SMatthew G. Knepley void (*f0)(const PetscScalar[], const PetscScalar[], const PetscReal[], const PetscReal[], PetscScalar[]) = fem->f0BdFuncs[field]; 420a9dc2124SMatthew G. Knepley void (*f1)(const PetscScalar[], const PetscScalar[], const PetscReal[], const PetscReal[], PetscScalar[]) = fem->f1BdFuncs[field]; 421652b88e8SMatthew G. Knepley /* Conforming batches */ 422652b88e8SMatthew G. Knepley PetscInt blockSize = numBasisFuncs*numQuadPoints; 423652b88e8SMatthew G. Knepley PetscInt numBlocks = 1; 424652b88e8SMatthew G. Knepley PetscInt batchSize = numBlocks * blockSize; 425652b88e8SMatthew G. Knepley PetscInt numBatches = numBatchesTmp; 426652b88e8SMatthew G. Knepley PetscInt numChunks = numPoints / (numBatches*batchSize); 427652b88e8SMatthew G. Knepley /* Remainder */ 428652b88e8SMatthew G. Knepley PetscInt numRemainder = numPoints % (numBatches * batchSize); 429652b88e8SMatthew G. Knepley PetscInt offset = numPoints - numRemainder; 430652b88e8SMatthew G. Knepley 43102a80efeSMatthew G. Knepley ierr = (*mesh->integrateBdResidualFEM)(numChunks*numBatches*batchSize, numFields, field, quadBd, u, v0, n, J, invJ, detJ, f0, f1, elemVec);CHKERRQ(ierr); 43202a80efeSMatthew G. Knepley ierr = (*mesh->integrateBdResidualFEM)(numRemainder, numFields, field, quadBd, &u[offset*cellDof], &v0[offset*dim], &n[offset*dim], &J[offset*dim*dim], &invJ[offset*dim*dim], &detJ[offset], 433652b88e8SMatthew G. Knepley f0, f1, &elemVec[offset*cellDof]);CHKERRQ(ierr); 434652b88e8SMatthew G. Knepley } 435652b88e8SMatthew G. Knepley for (p = 0; p < numPoints; ++p) { 436652b88e8SMatthew G. Knepley const PetscInt point = points[p]; 437652b88e8SMatthew G. Knepley 438652b88e8SMatthew G. Knepley if (mesh->printFEM > 1) {ierr = DMPrintCellVector(point, "Residual", cellDof, &elemVec[p*cellDof]);CHKERRQ(ierr);} 439652b88e8SMatthew G. Knepley ierr = DMPlexVecSetClosure(dm, NULL, F, point, &elemVec[p*cellDof], ADD_VALUES);CHKERRQ(ierr); 440652b88e8SMatthew G. Knepley } 441652b88e8SMatthew G. Knepley ierr = ISRestoreIndices(pointIS, &points);CHKERRQ(ierr); 442652b88e8SMatthew G. Knepley ierr = ISDestroy(&pointIS);CHKERRQ(ierr); 44302a80efeSMatthew G. Knepley ierr = PetscFree7(u,v0,n,J,invJ,detJ,elemVec);CHKERRQ(ierr); 444652b88e8SMatthew G. Knepley } 445cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 446cb1e1211SMatthew G Knepley } 447cb1e1211SMatthew G Knepley 448a0845e3aSMatthew G. Knepley #else 449a0845e3aSMatthew G. Knepley 450a0845e3aSMatthew G. Knepley #undef __FUNCT__ 451a0845e3aSMatthew G. Knepley #define __FUNCT__ "DMPlexComputeResidualFEM" 452a0845e3aSMatthew G. Knepley /*@ 453a0845e3aSMatthew G. Knepley DMPlexComputeResidualFEM - Form the local residual F from the local input X using pointwise functions specified by the user 454a0845e3aSMatthew G. Knepley 455a0845e3aSMatthew G. Knepley Input Parameters: 456a0845e3aSMatthew G. Knepley + dm - The mesh 457a0845e3aSMatthew G. Knepley . X - Local input vector 458a0845e3aSMatthew G. Knepley - user - The user context 459a0845e3aSMatthew G. Knepley 460a0845e3aSMatthew G. Knepley Output Parameter: 461a0845e3aSMatthew G. Knepley . F - Local output vector 462a0845e3aSMatthew G. Knepley 463a0845e3aSMatthew G. Knepley Note: 464a0845e3aSMatthew G. Knepley The second member of the user context must be an FEMContext. 465a0845e3aSMatthew G. Knepley 466a0845e3aSMatthew G. Knepley We form the residual one batch of elements at a time. This allows us to offload work onto an accelerator, 467a0845e3aSMatthew G. Knepley like a GPU, or vectorize on a multicore machine. 468a0845e3aSMatthew G. Knepley 469a0845e3aSMatthew G. Knepley Level: developer 470a0845e3aSMatthew G. Knepley 471a0845e3aSMatthew G. Knepley .seealso: DMPlexComputeJacobianActionFEM() 472a0845e3aSMatthew G. Knepley @*/ 473a0845e3aSMatthew G. Knepley PetscErrorCode DMPlexComputeResidualFEM(DM dm, Vec X, Vec F, void *user) 474a0845e3aSMatthew G. Knepley { 475a0845e3aSMatthew G. Knepley DM_Plex *mesh = (DM_Plex *) dm->data; 4769a559087SMatthew G. Knepley PetscFEM *fem = (PetscFEM *) user; 477a0845e3aSMatthew G. Knepley PetscFE *fe = fem->fe; 4789a559087SMatthew G. Knepley PetscFE *feAux = fem->feAux; 479f1ea0e2fSMatthew G. Knepley PetscFE *feBd = fem->feBd; 480a0845e3aSMatthew G. Knepley const char *name = "Residual"; 4819a559087SMatthew G. Knepley DM dmAux; 4829a559087SMatthew G. Knepley Vec A; 483a0845e3aSMatthew G. Knepley PetscQuadrature q; 484a0845e3aSMatthew G. Knepley PetscCellGeometry geom; 4859a559087SMatthew G. Knepley PetscSection section, sectionAux; 486a0845e3aSMatthew G. Knepley PetscReal *v0, *J, *invJ, *detJ; 4879a559087SMatthew G. Knepley PetscScalar *elemVec, *u, *a; 4889a559087SMatthew G. Knepley PetscInt dim, Nf, NfAux = 0, f, numCells, cStart, cEnd, c; 489a0845e3aSMatthew G. Knepley PetscInt cellDof = 0, numComponents = 0; 4909a559087SMatthew G. Knepley PetscInt cellDofAux = 0, numComponentsAux = 0; 491a0845e3aSMatthew G. Knepley PetscErrorCode ierr; 492a0845e3aSMatthew G. Knepley 493a0845e3aSMatthew G. Knepley PetscFunctionBegin; 494a0845e3aSMatthew G. Knepley ierr = PetscLogEventBegin(DMPLEX_ResidualFEM,dm,0,0,0);CHKERRQ(ierr); 495a0845e3aSMatthew G. Knepley ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr); 496a0845e3aSMatthew G. Knepley ierr = DMGetDefaultSection(dm, §ion);CHKERRQ(ierr); 4979a559087SMatthew G. Knepley ierr = PetscSectionGetNumFields(section, &Nf);CHKERRQ(ierr); 498a0845e3aSMatthew G. Knepley ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr); 499a0845e3aSMatthew G. Knepley numCells = cEnd - cStart; 5009a559087SMatthew G. Knepley for (f = 0; f < Nf; ++f) { 501a0845e3aSMatthew G. Knepley PetscInt Nb, Nc; 502a0845e3aSMatthew G. Knepley 503a0845e3aSMatthew G. Knepley ierr = PetscFEGetDimension(fe[f], &Nb);CHKERRQ(ierr); 504a0845e3aSMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[f], &Nc);CHKERRQ(ierr); 505a0845e3aSMatthew G. Knepley cellDof += Nb*Nc; 506a0845e3aSMatthew G. Knepley numComponents += Nc; 507a0845e3aSMatthew G. Knepley } 5089a559087SMatthew G. Knepley ierr = PetscObjectQuery((PetscObject) dm, "dmAux", (PetscObject *) &dmAux);CHKERRQ(ierr); 5099a559087SMatthew G. Knepley ierr = PetscObjectQuery((PetscObject) dm, "A", (PetscObject *) &A);CHKERRQ(ierr); 5109a559087SMatthew G. Knepley if (dmAux) { 5119a559087SMatthew G. Knepley ierr = DMGetDefaultSection(dmAux, §ionAux);CHKERRQ(ierr); 5129a559087SMatthew G. Knepley ierr = PetscSectionGetNumFields(sectionAux, &NfAux);CHKERRQ(ierr); 5139a559087SMatthew G. Knepley } 5149a559087SMatthew G. Knepley for (f = 0; f < NfAux; ++f) { 5159a559087SMatthew G. Knepley PetscInt Nb, Nc; 5169a559087SMatthew G. Knepley 5179a559087SMatthew G. Knepley ierr = PetscFEGetDimension(feAux[f], &Nb);CHKERRQ(ierr); 5189a559087SMatthew G. Knepley ierr = PetscFEGetNumComponents(feAux[f], &Nc);CHKERRQ(ierr); 5199a559087SMatthew G. Knepley cellDofAux += Nb*Nc; 5209a559087SMatthew G. Knepley numComponentsAux += Nc; 5219a559087SMatthew G. Knepley } 52272f94c41SMatthew G. Knepley ierr = DMPlexProjectFunctionLocal(dm, fe, fem->bcFuncs, INSERT_BC_VALUES, X);CHKERRQ(ierr); 523a0845e3aSMatthew G. Knepley ierr = VecSet(F, 0.0);CHKERRQ(ierr); 524dcca6d9dSJed Brown ierr = PetscMalloc6(numCells*cellDof,&u,numCells*dim,&v0,numCells*dim*dim,&J,numCells*dim*dim,&invJ,numCells,&detJ,numCells*cellDof,&elemVec);CHKERRQ(ierr); 525785e854fSJed Brown if (dmAux) {ierr = PetscMalloc1(numCells*cellDofAux, &a);CHKERRQ(ierr);} 526a0845e3aSMatthew G. Knepley for (c = cStart; c < cEnd; ++c) { 527a0845e3aSMatthew G. Knepley PetscScalar *x = NULL; 528a0845e3aSMatthew G. Knepley PetscInt i; 529a0845e3aSMatthew G. Knepley 530a0845e3aSMatthew G. Knepley ierr = DMPlexComputeCellGeometry(dm, c, &v0[c*dim], &J[c*dim*dim], &invJ[c*dim*dim], &detJ[c]);CHKERRQ(ierr); 531a0845e3aSMatthew G. Knepley if (detJ[c] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ[c], c); 532a0845e3aSMatthew G. Knepley ierr = DMPlexVecGetClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr); 533a0845e3aSMatthew G. Knepley for (i = 0; i < cellDof; ++i) u[c*cellDof+i] = x[i]; 534a0845e3aSMatthew G. Knepley ierr = DMPlexVecRestoreClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr); 5359a559087SMatthew G. Knepley if (dmAux) { 5369a559087SMatthew G. Knepley ierr = DMPlexVecGetClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr); 5379a559087SMatthew G. Knepley for (i = 0; i < cellDofAux; ++i) a[c*cellDofAux+i] = x[i]; 5389a559087SMatthew G. Knepley ierr = DMPlexVecRestoreClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr); 539a0845e3aSMatthew G. Knepley } 5409a559087SMatthew G. Knepley } 5419a559087SMatthew G. Knepley for (f = 0; f < Nf; ++f) { 542c012ea0aSMatthew G. Knepley void (*f0)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->f0Funcs[f]; 543c012ea0aSMatthew G. Knepley void (*f1)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->f1Funcs[f]; 544a0845e3aSMatthew G. Knepley PetscInt Nb; 545a0845e3aSMatthew G. Knepley /* Conforming batches */ 546f30c5766SMatthew G. Knepley PetscInt numChunks, numBatches, numBlocks, Ne, blockSize, batchSize; 547a0845e3aSMatthew G. Knepley /* Remainder */ 548a0845e3aSMatthew G. Knepley PetscInt Nr, offset; 549a0845e3aSMatthew G. Knepley 550a0845e3aSMatthew G. Knepley ierr = PetscFEGetQuadrature(fe[f], &q);CHKERRQ(ierr); 551a0845e3aSMatthew G. Knepley ierr = PetscFEGetDimension(fe[f], &Nb);CHKERRQ(ierr); 552f30c5766SMatthew G. Knepley ierr = PetscFEGetTileSizes(fe[f], NULL, &numBlocks, NULL, &numBatches);CHKERRQ(ierr); 553f9fd7fdbSMatthew G. Knepley blockSize = Nb*q.numPoints; 554a0845e3aSMatthew G. Knepley batchSize = numBlocks * blockSize; 555f30c5766SMatthew G. Knepley ierr = PetscFESetTileSizes(fe[f], blockSize, numBlocks, batchSize, numBatches);CHKERRQ(ierr); 556a0845e3aSMatthew G. Knepley numChunks = numCells / (numBatches*batchSize); 557a0845e3aSMatthew G. Knepley Ne = numChunks*numBatches*batchSize; 558a0845e3aSMatthew G. Knepley Nr = numCells % (numBatches*batchSize); 559a0845e3aSMatthew G. Knepley offset = numCells - Nr; 560a0845e3aSMatthew G. Knepley geom.v0 = v0; 561a0845e3aSMatthew G. Knepley geom.J = J; 562a0845e3aSMatthew G. Knepley geom.invJ = invJ; 563a0845e3aSMatthew G. Knepley geom.detJ = detJ; 5649a559087SMatthew G. Knepley ierr = PetscFEIntegrateResidual(fe[f], Ne, Nf, fe, f, geom, u, NfAux, feAux, a, f0, f1, elemVec);CHKERRQ(ierr); 565a0845e3aSMatthew G. Knepley geom.v0 = &v0[offset*dim]; 566a0845e3aSMatthew G. Knepley geom.J = &J[offset*dim*dim]; 567a0845e3aSMatthew G. Knepley geom.invJ = &invJ[offset*dim*dim]; 568a0845e3aSMatthew G. Knepley geom.detJ = &detJ[offset]; 5699a559087SMatthew G. Knepley ierr = PetscFEIntegrateResidual(fe[f], Nr, Nf, fe, f, geom, &u[offset*cellDof], NfAux, feAux, &a[offset*cellDofAux], f0, f1, &elemVec[offset*cellDof]);CHKERRQ(ierr); 570a0845e3aSMatthew G. Knepley } 571a0845e3aSMatthew G. Knepley for (c = cStart; c < cEnd; ++c) { 572a0845e3aSMatthew G. Knepley if (mesh->printFEM > 1) {ierr = DMPrintCellVector(c, name, cellDof, &elemVec[c*cellDof]);CHKERRQ(ierr);} 573a0845e3aSMatthew G. Knepley ierr = DMPlexVecSetClosure(dm, section, F, c, &elemVec[c*cellDof], ADD_VALUES);CHKERRQ(ierr); 574a0845e3aSMatthew G. Knepley } 575a0845e3aSMatthew G. Knepley ierr = PetscFree6(u,v0,J,invJ,detJ,elemVec);CHKERRQ(ierr); 5769a559087SMatthew G. Knepley if (dmAux) {ierr = PetscFree(a);CHKERRQ(ierr);} 577f1ea0e2fSMatthew G. Knepley if (feBd) { 578075da914SMatthew G. Knepley DMLabel label, depth; 579f1ea0e2fSMatthew G. Knepley IS pointIS; 580f1ea0e2fSMatthew G. Knepley const PetscInt *points; 581075da914SMatthew G. Knepley PetscInt dep, numPoints, p, numFaces; 582f1ea0e2fSMatthew G. Knepley PetscReal *n; 583f1ea0e2fSMatthew G. Knepley 584f1ea0e2fSMatthew G. Knepley ierr = DMPlexGetLabel(dm, "boundary", &label);CHKERRQ(ierr); 585075da914SMatthew G. Knepley ierr = DMPlexGetDepthLabel(dm, &depth);CHKERRQ(ierr); 586f1ea0e2fSMatthew G. Knepley ierr = DMLabelGetStratumSize(label, 1, &numPoints);CHKERRQ(ierr); 587f1ea0e2fSMatthew G. Knepley ierr = DMLabelGetStratumIS(label, 1, &pointIS);CHKERRQ(ierr); 588f1ea0e2fSMatthew G. Knepley ierr = ISGetIndices(pointIS, &points);CHKERRQ(ierr); 589f1ea0e2fSMatthew G. Knepley for (f = 0, cellDof = 0, numComponents = 0; f < Nf; ++f) { 590f1ea0e2fSMatthew G. Knepley PetscInt Nb, Nc; 591f1ea0e2fSMatthew G. Knepley 592f1ea0e2fSMatthew G. Knepley ierr = PetscFEGetDimension(feBd[f], &Nb);CHKERRQ(ierr); 593f1ea0e2fSMatthew G. Knepley ierr = PetscFEGetNumComponents(feBd[f], &Nc);CHKERRQ(ierr); 594f1ea0e2fSMatthew G. Knepley cellDof += Nb*Nc; 595f1ea0e2fSMatthew G. Knepley numComponents += Nc; 596f1ea0e2fSMatthew G. Knepley } 597075da914SMatthew G. Knepley for (p = 0, numFaces = 0; p < numPoints; ++p) { 598075da914SMatthew G. Knepley ierr = DMLabelGetValue(depth, points[p], &dep);CHKERRQ(ierr); 599075da914SMatthew G. Knepley if (dep == dim-1) ++numFaces; 600075da914SMatthew G. Knepley } 601dcca6d9dSJed Brown ierr = PetscMalloc7(numFaces*cellDof,&u,numFaces*dim,&v0,numFaces*dim,&n,numFaces*dim*dim,&J,numFaces*dim*dim,&invJ,numFaces,&detJ,numFaces*cellDof,&elemVec);CHKERRQ(ierr); 602075da914SMatthew G. Knepley for (p = 0, f = 0; p < numPoints; ++p) { 603f1ea0e2fSMatthew G. Knepley const PetscInt point = points[p]; 604f1ea0e2fSMatthew G. Knepley PetscScalar *x = NULL; 605f1ea0e2fSMatthew G. Knepley PetscInt i; 606f1ea0e2fSMatthew G. Knepley 607075da914SMatthew G. Knepley ierr = DMLabelGetValue(depth, points[p], &dep);CHKERRQ(ierr); 608075da914SMatthew G. Knepley if (dep != dim-1) continue; 609075da914SMatthew G. Knepley ierr = DMPlexComputeCellGeometry(dm, point, &v0[f*dim], &J[f*dim*dim], &invJ[f*dim*dim], &detJ[f]);CHKERRQ(ierr); 610a8007bbfSMatthew G. Knepley ierr = DMPlexComputeCellGeometryFVM(dm, point, NULL, NULL, &n[f*dim]); 611075da914SMatthew G. Knepley if (detJ[f] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for face %d", detJ[f], point); 612f1ea0e2fSMatthew G. Knepley ierr = DMPlexVecGetClosure(dm, section, X, point, NULL, &x);CHKERRQ(ierr); 613075da914SMatthew G. Knepley for (i = 0; i < cellDof; ++i) u[f*cellDof+i] = x[i]; 614f1ea0e2fSMatthew G. Knepley ierr = DMPlexVecRestoreClosure(dm, section, X, point, NULL, &x);CHKERRQ(ierr); 615075da914SMatthew G. Knepley ++f; 616f1ea0e2fSMatthew G. Knepley } 617f1ea0e2fSMatthew G. Knepley for (f = 0; f < Nf; ++f) { 618f1ea0e2fSMatthew G. Knepley void (*f0)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], const PetscReal[], PetscScalar[]) = fem->f0BdFuncs[f]; 619f1ea0e2fSMatthew G. Knepley void (*f1)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], const PetscReal[], PetscScalar[]) = fem->f1BdFuncs[f]; 620f1ea0e2fSMatthew G. Knepley PetscInt Nb; 621f1ea0e2fSMatthew G. Knepley /* Conforming batches */ 622f1ea0e2fSMatthew G. Knepley PetscInt numChunks, numBatches, numBlocks, Ne, blockSize, batchSize; 623f1ea0e2fSMatthew G. Knepley /* Remainder */ 624f1ea0e2fSMatthew G. Knepley PetscInt Nr, offset; 625f1ea0e2fSMatthew G. Knepley 626f1ea0e2fSMatthew G. Knepley ierr = PetscFEGetQuadrature(feBd[f], &q);CHKERRQ(ierr); 627f1ea0e2fSMatthew G. Knepley ierr = PetscFEGetDimension(feBd[f], &Nb);CHKERRQ(ierr); 628f1ea0e2fSMatthew G. Knepley ierr = PetscFEGetTileSizes(feBd[f], NULL, &numBlocks, NULL, &numBatches);CHKERRQ(ierr); 629f9fd7fdbSMatthew G. Knepley blockSize = Nb*q.numPoints; 630f1ea0e2fSMatthew G. Knepley batchSize = numBlocks * blockSize; 631f1ea0e2fSMatthew G. Knepley ierr = PetscFESetTileSizes(feBd[f], blockSize, numBlocks, batchSize, numBatches);CHKERRQ(ierr); 632075da914SMatthew G. Knepley numChunks = numFaces / (numBatches*batchSize); 633f1ea0e2fSMatthew G. Knepley Ne = numChunks*numBatches*batchSize; 634075da914SMatthew G. Knepley Nr = numFaces % (numBatches*batchSize); 635075da914SMatthew G. Knepley offset = numFaces - Nr; 636f1ea0e2fSMatthew G. Knepley geom.v0 = v0; 637f1ea0e2fSMatthew G. Knepley geom.n = n; 638f1ea0e2fSMatthew G. Knepley geom.J = J; 639f1ea0e2fSMatthew G. Knepley geom.invJ = invJ; 640f1ea0e2fSMatthew G. Knepley geom.detJ = detJ; 641f1ea0e2fSMatthew G. Knepley ierr = PetscFEIntegrateBdResidual(feBd[f], Ne, Nf, feBd, f, geom, u, 0, NULL, NULL, f0, f1, elemVec);CHKERRQ(ierr); 642f1ea0e2fSMatthew G. Knepley geom.v0 = &v0[offset*dim]; 643f1ea0e2fSMatthew G. Knepley geom.n = &n[offset*dim]; 644f1ea0e2fSMatthew G. Knepley geom.J = &J[offset*dim*dim]; 645f1ea0e2fSMatthew G. Knepley geom.invJ = &invJ[offset*dim*dim]; 646f1ea0e2fSMatthew G. Knepley geom.detJ = &detJ[offset]; 647f1ea0e2fSMatthew G. Knepley ierr = PetscFEIntegrateBdResidual(feBd[f], Nr, Nf, feBd, f, geom, &u[offset*cellDof], 0, NULL, NULL, f0, f1, &elemVec[offset*cellDof]);CHKERRQ(ierr); 648f1ea0e2fSMatthew G. Knepley } 649075da914SMatthew G. Knepley for (p = 0, f = 0; p < numPoints; ++p) { 650f1ea0e2fSMatthew G. Knepley const PetscInt point = points[p]; 651f1ea0e2fSMatthew G. Knepley 652075da914SMatthew G. Knepley ierr = DMLabelGetValue(depth, point, &dep);CHKERRQ(ierr); 653075da914SMatthew G. Knepley if (dep != dim-1) continue; 654075da914SMatthew G. Knepley if (mesh->printFEM > 1) {ierr = DMPrintCellVector(point, "BdResidual", cellDof, &elemVec[f*cellDof]);CHKERRQ(ierr);} 655075da914SMatthew G. Knepley ierr = DMPlexVecSetClosure(dm, NULL, F, point, &elemVec[f*cellDof], ADD_VALUES);CHKERRQ(ierr); 656075da914SMatthew G. Knepley ++f; 657f1ea0e2fSMatthew G. Knepley } 658f1ea0e2fSMatthew G. Knepley ierr = ISRestoreIndices(pointIS, &points);CHKERRQ(ierr); 659f1ea0e2fSMatthew G. Knepley ierr = ISDestroy(&pointIS);CHKERRQ(ierr); 660f1ea0e2fSMatthew G. Knepley ierr = PetscFree7(u,v0,n,J,invJ,detJ,elemVec);CHKERRQ(ierr); 661f1ea0e2fSMatthew G. Knepley } 6626113b454SMatthew G. Knepley if (mesh->printFEM) {ierr = DMPrintLocalVec(dm, name, mesh->printTol, F);CHKERRQ(ierr);} 663a0845e3aSMatthew G. Knepley ierr = PetscLogEventEnd(DMPLEX_ResidualFEM,dm,0,0,0);CHKERRQ(ierr); 664a0845e3aSMatthew G. Knepley PetscFunctionReturn(0); 665a0845e3aSMatthew G. Knepley } 666a0845e3aSMatthew G. Knepley 667a0845e3aSMatthew G. Knepley #endif 668a0845e3aSMatthew G. Knepley 669cb1e1211SMatthew G Knepley #undef __FUNCT__ 670cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeJacobianActionFEM" 671cb1e1211SMatthew G Knepley /*@C 672cb1e1211SMatthew G Knepley DMPlexComputeJacobianActionFEM - Form the local action of Jacobian J(u) on the local input X using pointwise functions specified by the user 673cb1e1211SMatthew G Knepley 674cb1e1211SMatthew G Knepley Input Parameters: 675cb1e1211SMatthew G Knepley + dm - The mesh 676cb1e1211SMatthew G Knepley . J - The Jacobian shell matrix 677cb1e1211SMatthew G Knepley . X - Local input vector 678cb1e1211SMatthew G Knepley - user - The user context 679cb1e1211SMatthew G Knepley 680cb1e1211SMatthew G Knepley Output Parameter: 681cb1e1211SMatthew G Knepley . F - Local output vector 682cb1e1211SMatthew G Knepley 683cb1e1211SMatthew G Knepley Note: 684cb1e1211SMatthew G Knepley The second member of the user context must be an FEMContext. 685cb1e1211SMatthew G Knepley 686cb1e1211SMatthew G Knepley We form the residual one batch of elements at a time. This allows us to offload work onto an accelerator, 687cb1e1211SMatthew G Knepley like a GPU, or vectorize on a multicore machine. 688cb1e1211SMatthew G Knepley 6890059ad2aSSatish Balay Level: developer 6900059ad2aSSatish Balay 691cb1e1211SMatthew G Knepley .seealso: DMPlexComputeResidualFEM() 692878cb397SSatish Balay @*/ 693cb1e1211SMatthew G Knepley PetscErrorCode DMPlexComputeJacobianActionFEM(DM dm, Mat Jac, Vec X, Vec F, void *user) 694cb1e1211SMatthew G Knepley { 695cb1e1211SMatthew G Knepley DM_Plex *mesh = (DM_Plex *) dm->data; 6969a559087SMatthew G. Knepley PetscFEM *fem = (PetscFEM *) user; 6970483ade4SMatthew G. Knepley PetscFE *fe = fem->fe; 6980483ade4SMatthew G. Knepley PetscQuadrature quad; 6990483ade4SMatthew G. Knepley PetscCellGeometry geom; 700cb1e1211SMatthew G Knepley PetscSection section; 701cb1e1211SMatthew G Knepley JacActionCtx *jctx; 702cb1e1211SMatthew G Knepley PetscReal *v0, *J, *invJ, *detJ; 703cb1e1211SMatthew G Knepley PetscScalar *elemVec, *u, *a; 7040483ade4SMatthew G. Knepley PetscInt dim, numFields, field, numCells, cStart, cEnd, c; 705cb1e1211SMatthew G Knepley PetscInt cellDof = 0; 706cb1e1211SMatthew G Knepley PetscErrorCode ierr; 707cb1e1211SMatthew G Knepley 708cb1e1211SMatthew G Knepley PetscFunctionBegin; 7090483ade4SMatthew G. Knepley /* ierr = PetscLogEventBegin(DMPLEX_JacobianActionFEM,dm,0,0,0);CHKERRQ(ierr); */ 710cb1e1211SMatthew G Knepley ierr = MatShellGetContext(Jac, &jctx);CHKERRQ(ierr); 711cb1e1211SMatthew G Knepley ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr); 712cb1e1211SMatthew G Knepley ierr = DMGetDefaultSection(dm, §ion);CHKERRQ(ierr); 713cb1e1211SMatthew G Knepley ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr); 714cb1e1211SMatthew G Knepley ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr); 715cb1e1211SMatthew G Knepley numCells = cEnd - cStart; 716cb1e1211SMatthew G Knepley for (field = 0; field < numFields; ++field) { 7170483ade4SMatthew G. Knepley PetscInt Nb, Nc; 7180483ade4SMatthew G. Knepley 7190483ade4SMatthew G. Knepley ierr = PetscFEGetDimension(fe[field], &Nb);CHKERRQ(ierr); 7200483ade4SMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[field], &Nc);CHKERRQ(ierr); 7210483ade4SMatthew G. Knepley cellDof += Nb*Nc; 722cb1e1211SMatthew G Knepley } 723cb1e1211SMatthew G Knepley ierr = VecSet(F, 0.0);CHKERRQ(ierr); 724dcca6d9dSJed Brown ierr = PetscMalloc7(numCells*cellDof,&u,numCells*cellDof,&a,numCells*dim,&v0,numCells*dim*dim,&J,numCells*dim*dim,&invJ,numCells,&detJ,numCells*cellDof,&elemVec);CHKERRQ(ierr); 725cb1e1211SMatthew G Knepley for (c = cStart; c < cEnd; ++c) { 726a1e44745SMatthew G. Knepley PetscScalar *x = NULL; 727cb1e1211SMatthew G Knepley PetscInt i; 728cb1e1211SMatthew G Knepley 729cb1e1211SMatthew G Knepley ierr = DMPlexComputeCellGeometry(dm, c, &v0[c*dim], &J[c*dim*dim], &invJ[c*dim*dim], &detJ[c]);CHKERRQ(ierr); 730cb1e1211SMatthew G Knepley if (detJ[c] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ[c], c); 731cb1e1211SMatthew G Knepley ierr = DMPlexVecGetClosure(dm, NULL, jctx->u, c, NULL, &x);CHKERRQ(ierr); 732cb1e1211SMatthew G Knepley for (i = 0; i < cellDof; ++i) u[c*cellDof+i] = x[i]; 733cb1e1211SMatthew G Knepley ierr = DMPlexVecRestoreClosure(dm, NULL, jctx->u, c, NULL, &x);CHKERRQ(ierr); 734cb1e1211SMatthew G Knepley ierr = DMPlexVecGetClosure(dm, NULL, X, c, NULL, &x);CHKERRQ(ierr); 735cb1e1211SMatthew G Knepley for (i = 0; i < cellDof; ++i) a[c*cellDof+i] = x[i]; 736cb1e1211SMatthew G Knepley ierr = DMPlexVecRestoreClosure(dm, NULL, X, c, NULL, &x);CHKERRQ(ierr); 737cb1e1211SMatthew G Knepley } 738cb1e1211SMatthew G Knepley for (field = 0; field < numFields; ++field) { 7390483ade4SMatthew G. Knepley PetscInt Nb; 740cb1e1211SMatthew G Knepley /* Conforming batches */ 741cb1e1211SMatthew G Knepley PetscInt numBlocks = 1; 7420483ade4SMatthew G. Knepley PetscInt numBatches = 1; 7430483ade4SMatthew G. Knepley PetscInt numChunks, Ne, blockSize, batchSize; 744cb1e1211SMatthew G Knepley /* Remainder */ 7450483ade4SMatthew G. Knepley PetscInt Nr, offset; 746cb1e1211SMatthew G Knepley 7470483ade4SMatthew G. Knepley ierr = PetscFEGetQuadrature(fe[field], &quad);CHKERRQ(ierr); 7480483ade4SMatthew G. Knepley ierr = PetscFEGetDimension(fe[field], &Nb);CHKERRQ(ierr); 749f9fd7fdbSMatthew G. Knepley blockSize = Nb*quad.numPoints; 7500483ade4SMatthew G. Knepley batchSize = numBlocks * blockSize; 7510483ade4SMatthew G. Knepley numChunks = numCells / (numBatches*batchSize); 7520483ade4SMatthew G. Knepley Ne = numChunks*numBatches*batchSize; 7530483ade4SMatthew G. Knepley Nr = numCells % (numBatches*batchSize); 7540483ade4SMatthew G. Knepley offset = numCells - Nr; 7550483ade4SMatthew G. Knepley geom.v0 = v0; 7560483ade4SMatthew G. Knepley geom.J = J; 7570483ade4SMatthew G. Knepley geom.invJ = invJ; 7580483ade4SMatthew G. Knepley geom.detJ = detJ; 7590483ade4SMatthew G. Knepley ierr = PetscFEIntegrateJacobianAction(fe[field], Ne, numFields, fe, field, geom, u, a, fem->g0Funcs, fem->g1Funcs, fem->g2Funcs, fem->g3Funcs, elemVec);CHKERRQ(ierr); 7600483ade4SMatthew G. Knepley geom.v0 = &v0[offset*dim]; 7610483ade4SMatthew G. Knepley geom.J = &J[offset*dim*dim]; 7620483ade4SMatthew G. Knepley geom.invJ = &invJ[offset*dim*dim]; 7630483ade4SMatthew G. Knepley geom.detJ = &detJ[offset]; 7640483ade4SMatthew G. Knepley ierr = PetscFEIntegrateJacobianAction(fe[field], Nr, numFields, fe, field, geom, &u[offset*cellDof], &a[offset*cellDof], 765cb1e1211SMatthew G Knepley fem->g0Funcs, fem->g1Funcs, fem->g2Funcs, fem->g3Funcs, &elemVec[offset*cellDof]);CHKERRQ(ierr); 766cb1e1211SMatthew G Knepley } 767cb1e1211SMatthew G Knepley for (c = cStart; c < cEnd; ++c) { 768cb1e1211SMatthew G Knepley if (mesh->printFEM > 1) {ierr = DMPrintCellVector(c, "Jacobian Action", cellDof, &elemVec[c*cellDof]);CHKERRQ(ierr);} 769cb1e1211SMatthew G Knepley ierr = DMPlexVecSetClosure(dm, NULL, F, c, &elemVec[c*cellDof], ADD_VALUES);CHKERRQ(ierr); 770cb1e1211SMatthew G Knepley } 771cb1e1211SMatthew G Knepley ierr = PetscFree7(u,a,v0,J,invJ,detJ,elemVec);CHKERRQ(ierr); 772cb1e1211SMatthew G Knepley if (mesh->printFEM) { 773cb1e1211SMatthew G Knepley PetscMPIInt rank, numProcs; 774cb1e1211SMatthew G Knepley PetscInt p; 775cb1e1211SMatthew G Knepley 776cb1e1211SMatthew G Knepley ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)dm), &rank);CHKERRQ(ierr); 777cb1e1211SMatthew G Knepley ierr = MPI_Comm_size(PetscObjectComm((PetscObject)dm), &numProcs);CHKERRQ(ierr); 77886a74ee0SMatthew G. Knepley ierr = PetscPrintf(PetscObjectComm((PetscObject)dm), "Jacobian Action:\n");CHKERRQ(ierr); 779cb1e1211SMatthew G Knepley for (p = 0; p < numProcs; ++p) { 780cb1e1211SMatthew G Knepley if (p == rank) {ierr = VecView(F, PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr);} 781cb1e1211SMatthew G Knepley ierr = PetscBarrier((PetscObject) dm);CHKERRQ(ierr); 782cb1e1211SMatthew G Knepley } 783cb1e1211SMatthew G Knepley } 7840483ade4SMatthew G. Knepley /* ierr = PetscLogEventEnd(DMPLEX_JacobianActionFEM,dm,0,0,0);CHKERRQ(ierr); */ 785cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 786cb1e1211SMatthew G Knepley } 787cb1e1211SMatthew G Knepley 788cb1e1211SMatthew G Knepley #undef __FUNCT__ 789cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeJacobianFEM" 790cb1e1211SMatthew G Knepley /*@ 791cb1e1211SMatthew G Knepley DMPlexComputeJacobianFEM - Form the local portion of the Jacobian matrix J at the local solution X using pointwise functions specified by the user. 792cb1e1211SMatthew G Knepley 793cb1e1211SMatthew G Knepley Input Parameters: 794cb1e1211SMatthew G Knepley + dm - The mesh 795cb1e1211SMatthew G Knepley . X - Local input vector 796cb1e1211SMatthew G Knepley - user - The user context 797cb1e1211SMatthew G Knepley 798cb1e1211SMatthew G Knepley Output Parameter: 799cb1e1211SMatthew G Knepley . Jac - Jacobian matrix 800cb1e1211SMatthew G Knepley 801cb1e1211SMatthew G Knepley Note: 802cb1e1211SMatthew G Knepley The second member of the user context must be an FEMContext. 803cb1e1211SMatthew G Knepley 804cb1e1211SMatthew G Knepley We form the residual one batch of elements at a time. This allows us to offload work onto an accelerator, 805cb1e1211SMatthew G Knepley like a GPU, or vectorize on a multicore machine. 806cb1e1211SMatthew G Knepley 8070059ad2aSSatish Balay Level: developer 8080059ad2aSSatish Balay 809cb1e1211SMatthew G Knepley .seealso: FormFunctionLocal() 810878cb397SSatish Balay @*/ 811cb1e1211SMatthew G Knepley PetscErrorCode DMPlexComputeJacobianFEM(DM dm, Vec X, Mat Jac, Mat JacP, MatStructure *str,void *user) 812cb1e1211SMatthew G Knepley { 813cb1e1211SMatthew G Knepley DM_Plex *mesh = (DM_Plex *) dm->data; 8149a559087SMatthew G. Knepley PetscFEM *fem = (PetscFEM *) user; 815a319912fSMatthew G. Knepley PetscFE *fe = fem->fe; 816754551f4SMatthew G. Knepley PetscFE *feAux = fem->feAux; 817a319912fSMatthew G. Knepley const char *name = "Jacobian"; 818754551f4SMatthew G. Knepley DM dmAux; 819754551f4SMatthew G. Knepley Vec A; 820a319912fSMatthew G. Knepley PetscQuadrature quad; 821a319912fSMatthew G. Knepley PetscCellGeometry geom; 822754551f4SMatthew G. Knepley PetscSection section, globalSection, sectionAux; 823cb1e1211SMatthew G Knepley PetscReal *v0, *J, *invJ, *detJ; 824754551f4SMatthew G. Knepley PetscScalar *elemMat, *u, *a; 825754551f4SMatthew G. Knepley PetscInt dim, Nf, NfAux = 0, f, fieldI, fieldJ, numCells, cStart, cEnd, c; 826cb1e1211SMatthew G Knepley PetscInt cellDof = 0, numComponents = 0; 827754551f4SMatthew G. Knepley PetscInt cellDofAux = 0, numComponentsAux = 0; 828cb1e1211SMatthew G Knepley PetscBool isShell; 829cb1e1211SMatthew G Knepley PetscErrorCode ierr; 830cb1e1211SMatthew G Knepley 831cb1e1211SMatthew G Knepley PetscFunctionBegin; 832a319912fSMatthew G. Knepley ierr = PetscLogEventBegin(DMPLEX_JacobianFEM,dm,0,0,0);CHKERRQ(ierr); 833cb1e1211SMatthew G Knepley ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr); 834cb1e1211SMatthew G Knepley ierr = DMGetDefaultSection(dm, §ion);CHKERRQ(ierr); 835a319912fSMatthew G. Knepley ierr = DMGetDefaultGlobalSection(dm, &globalSection);CHKERRQ(ierr); 836754551f4SMatthew G. Knepley ierr = PetscSectionGetNumFields(section, &Nf);CHKERRQ(ierr); 837cb1e1211SMatthew G Knepley ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr); 838cb1e1211SMatthew G Knepley numCells = cEnd - cStart; 839754551f4SMatthew G. Knepley for (f = 0; f < Nf; ++f) { 840a319912fSMatthew G. Knepley PetscInt Nb, Nc; 841a319912fSMatthew G. Knepley 842a319912fSMatthew G. Knepley ierr = PetscFEGetDimension(fe[f], &Nb);CHKERRQ(ierr); 843a319912fSMatthew G. Knepley ierr = PetscFEGetNumComponents(fe[f], &Nc);CHKERRQ(ierr); 844a319912fSMatthew G. Knepley cellDof += Nb*Nc; 845a319912fSMatthew G. Knepley numComponents += Nc; 846cb1e1211SMatthew G Knepley } 847754551f4SMatthew G. Knepley ierr = PetscObjectQuery((PetscObject) dm, "dmAux", (PetscObject *) &dmAux);CHKERRQ(ierr); 848754551f4SMatthew G. Knepley ierr = PetscObjectQuery((PetscObject) dm, "A", (PetscObject *) &A);CHKERRQ(ierr); 849754551f4SMatthew G. Knepley if (dmAux) { 850754551f4SMatthew G. Knepley ierr = DMGetDefaultSection(dmAux, §ionAux);CHKERRQ(ierr); 851754551f4SMatthew G. Knepley ierr = PetscSectionGetNumFields(sectionAux, &NfAux);CHKERRQ(ierr); 852754551f4SMatthew G. Knepley } 853754551f4SMatthew G. Knepley for (f = 0; f < NfAux; ++f) { 854754551f4SMatthew G. Knepley PetscInt Nb, Nc; 855754551f4SMatthew G. Knepley 856754551f4SMatthew G. Knepley ierr = PetscFEGetDimension(feAux[f], &Nb);CHKERRQ(ierr); 857754551f4SMatthew G. Knepley ierr = PetscFEGetNumComponents(feAux[f], &Nc);CHKERRQ(ierr); 858754551f4SMatthew G. Knepley cellDofAux += Nb*Nc; 859754551f4SMatthew G. Knepley numComponentsAux += Nc; 860754551f4SMatthew G. Knepley } 86172f94c41SMatthew G. Knepley ierr = DMPlexProjectFunctionLocal(dm, fe, fem->bcFuncs, INSERT_BC_VALUES, X);CHKERRQ(ierr); 862cb1e1211SMatthew G Knepley ierr = MatZeroEntries(JacP);CHKERRQ(ierr); 863dcca6d9dSJed Brown ierr = PetscMalloc6(numCells*cellDof,&u,numCells*dim,&v0,numCells*dim*dim,&J,numCells*dim*dim,&invJ,numCells,&detJ,numCells*cellDof*cellDof,&elemMat);CHKERRQ(ierr); 864785e854fSJed Brown if (dmAux) {ierr = PetscMalloc1(numCells*cellDofAux, &a);CHKERRQ(ierr);} 865cb1e1211SMatthew G Knepley for (c = cStart; c < cEnd; ++c) { 866a1e44745SMatthew G. Knepley PetscScalar *x = NULL; 867cb1e1211SMatthew G Knepley PetscInt i; 868cb1e1211SMatthew G Knepley 869cb1e1211SMatthew G Knepley ierr = DMPlexComputeCellGeometry(dm, c, &v0[c*dim], &J[c*dim*dim], &invJ[c*dim*dim], &detJ[c]);CHKERRQ(ierr); 870cb1e1211SMatthew G Knepley if (detJ[c] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ[c], c); 871a319912fSMatthew G. Knepley ierr = DMPlexVecGetClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr); 872cb1e1211SMatthew G Knepley for (i = 0; i < cellDof; ++i) u[c*cellDof+i] = x[i]; 873a319912fSMatthew G. Knepley ierr = DMPlexVecRestoreClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr); 874754551f4SMatthew G. Knepley if (dmAux) { 875754551f4SMatthew G. Knepley ierr = DMPlexVecGetClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr); 876754551f4SMatthew G. Knepley for (i = 0; i < cellDofAux; ++i) a[c*cellDofAux+i] = x[i]; 877754551f4SMatthew G. Knepley ierr = DMPlexVecRestoreClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr); 878754551f4SMatthew G. Knepley } 879cb1e1211SMatthew G Knepley } 880cb1e1211SMatthew G Knepley ierr = PetscMemzero(elemMat, numCells*cellDof*cellDof * sizeof(PetscScalar));CHKERRQ(ierr); 881754551f4SMatthew G. Knepley for (fieldI = 0; fieldI < Nf; ++fieldI) { 882a319912fSMatthew G. Knepley PetscInt Nb; 883cb1e1211SMatthew G Knepley /* Conforming batches */ 884754551f4SMatthew G. Knepley PetscInt numChunks, numBatches, numBlocks, Ne, blockSize, batchSize; 885cb1e1211SMatthew G Knepley /* Remainder */ 886a319912fSMatthew G. Knepley PetscInt Nr, offset; 887cb1e1211SMatthew G Knepley 888754551f4SMatthew G. Knepley ierr = PetscFEGetQuadrature(fe[fieldI], &quad);CHKERRQ(ierr); 889754551f4SMatthew G. Knepley ierr = PetscFEGetDimension(fe[fieldI], &Nb);CHKERRQ(ierr); 890754551f4SMatthew G. Knepley ierr = PetscFEGetTileSizes(fe[fieldI], NULL, &numBlocks, NULL, &numBatches);CHKERRQ(ierr); 891f9fd7fdbSMatthew G. Knepley blockSize = Nb*quad.numPoints; 892a319912fSMatthew G. Knepley batchSize = numBlocks * blockSize; 893754551f4SMatthew G. Knepley ierr = PetscFESetTileSizes(fe[fieldI], blockSize, numBlocks, batchSize, numBatches);CHKERRQ(ierr); 894a319912fSMatthew G. Knepley numChunks = numCells / (numBatches*batchSize); 895a319912fSMatthew G. Knepley Ne = numChunks*numBatches*batchSize; 896a319912fSMatthew G. Knepley Nr = numCells % (numBatches*batchSize); 897a319912fSMatthew G. Knepley offset = numCells - Nr; 898754551f4SMatthew G. Knepley for (fieldJ = 0; fieldJ < Nf; ++fieldJ) { 899754551f4SMatthew G. Knepley void (*g0)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g0Funcs[fieldI*Nf+fieldJ]; 900754551f4SMatthew G. Knepley void (*g1)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g1Funcs[fieldI*Nf+fieldJ]; 901754551f4SMatthew G. Knepley void (*g2)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g2Funcs[fieldI*Nf+fieldJ]; 902754551f4SMatthew G. Knepley void (*g3)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g3Funcs[fieldI*Nf+fieldJ]; 903754551f4SMatthew G. Knepley 904a319912fSMatthew G. Knepley geom.v0 = v0; 905a319912fSMatthew G. Knepley geom.J = J; 906a319912fSMatthew G. Knepley geom.invJ = invJ; 907a319912fSMatthew G. Knepley geom.detJ = detJ; 908754551f4SMatthew G. Knepley ierr = PetscFEIntegrateJacobian(fe[fieldI], Ne, Nf, fe, fieldI, fieldJ, geom, u, NfAux, feAux, a, g0, g1, g2, g3, elemMat);CHKERRQ(ierr); 909a319912fSMatthew G. Knepley geom.v0 = &v0[offset*dim]; 910a319912fSMatthew G. Knepley geom.J = &J[offset*dim*dim]; 911a319912fSMatthew G. Knepley geom.invJ = &invJ[offset*dim*dim]; 912a319912fSMatthew G. Knepley geom.detJ = &detJ[offset]; 913754551f4SMatthew G. Knepley ierr = PetscFEIntegrateJacobian(fe[fieldI], Nr, Nf, fe, fieldI, fieldJ, geom, &u[offset*cellDof], NfAux, feAux, &a[offset*cellDofAux], g0, g1, g2, g3, &elemMat[offset*cellDof*cellDof]);CHKERRQ(ierr); 914cb1e1211SMatthew G Knepley } 915cb1e1211SMatthew G Knepley } 916cb1e1211SMatthew G Knepley for (c = cStart; c < cEnd; ++c) { 917a319912fSMatthew G. Knepley if (mesh->printFEM > 1) {ierr = DMPrintCellMatrix(c, name, cellDof, cellDof, &elemMat[c*cellDof*cellDof]);CHKERRQ(ierr);} 918a319912fSMatthew G. Knepley ierr = DMPlexMatSetClosure(dm, section, globalSection, JacP, c, &elemMat[c*cellDof*cellDof], ADD_VALUES);CHKERRQ(ierr); 919cb1e1211SMatthew G Knepley } 920cb1e1211SMatthew G Knepley ierr = PetscFree6(u,v0,J,invJ,detJ,elemMat);CHKERRQ(ierr); 921754551f4SMatthew G. Knepley if (dmAux) {ierr = PetscFree(a);CHKERRQ(ierr);} 922cb1e1211SMatthew G Knepley ierr = MatAssemblyBegin(JacP, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 923cb1e1211SMatthew G Knepley ierr = MatAssemblyEnd(JacP, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 924cb1e1211SMatthew G Knepley if (mesh->printFEM) { 925a319912fSMatthew G. Knepley ierr = PetscPrintf(PETSC_COMM_WORLD, "%s:\n", name);CHKERRQ(ierr); 926cb1e1211SMatthew G Knepley ierr = MatChop(JacP, 1.0e-10);CHKERRQ(ierr); 927cb1e1211SMatthew G Knepley ierr = MatView(JacP, PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 928cb1e1211SMatthew G Knepley } 929a319912fSMatthew G. Knepley ierr = PetscLogEventEnd(DMPLEX_JacobianFEM,dm,0,0,0);CHKERRQ(ierr); 930cb1e1211SMatthew G Knepley ierr = PetscObjectTypeCompare((PetscObject) Jac, MATSHELL, &isShell);CHKERRQ(ierr); 931cb1e1211SMatthew G Knepley if (isShell) { 932cb1e1211SMatthew G Knepley JacActionCtx *jctx; 933cb1e1211SMatthew G Knepley 934cb1e1211SMatthew G Knepley ierr = MatShellGetContext(Jac, &jctx);CHKERRQ(ierr); 935cb1e1211SMatthew G Knepley ierr = VecCopy(X, jctx->u);CHKERRQ(ierr); 936cb1e1211SMatthew G Knepley } 937cb1e1211SMatthew G Knepley *str = SAME_NONZERO_PATTERN; 938cb1e1211SMatthew G Knepley PetscFunctionReturn(0); 939cb1e1211SMatthew G Knepley } 940