1ed264d09SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at 2ed264d09SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights 3ed264d09SValeria Barra // reserved. See files LICENSE and NOTICE for details. 4ed264d09SValeria Barra // 5ed264d09SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software 6ed264d09SValeria Barra // libraries and APIs for efficient high-order finite element and spectral 7ed264d09SValeria Barra // element discretizations for exascale applications. For more information and 8ed264d09SValeria Barra // source code availability see http://github.com/ceed. 9ed264d09SValeria Barra // 10ed264d09SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, 11ed264d09SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office 12ed264d09SValeria Barra // of Science and the National Nuclear Security Administration) responsible for 13ed264d09SValeria Barra // the planning and preparation of a capable exascale ecosystem, including 14ed264d09SValeria Barra // software, applications, hardware, advanced system engineering and early 15ed264d09SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative. 16ed264d09SValeria Barra 17ed264d09SValeria Barra /// @file 18ed264d09SValeria Barra /// libCEED QFunctions for mass operator example for a scalar field on the sphere using PETSc 19ed264d09SValeria Barra 20f6b55d2cSvaleriabarra #ifndef bp1sphere_h 21f6b55d2cSvaleriabarra #define bp1sphere_h 22f6b55d2cSvaleriabarra 23ed264d09SValeria Barra #ifndef __CUDACC__ 24ed264d09SValeria Barra # include <math.h> 25ed264d09SValeria Barra #endif 26ed264d09SValeria Barra 27e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 28ed264d09SValeria Barra // This QFunction sets up the geometric factors required for integration and 29ed264d09SValeria Barra // coordinate transformations when reference coordinates have a different 30ed264d09SValeria Barra // dimension than the one of physical coordinates 31ed264d09SValeria Barra // 32ed264d09SValeria Barra // Reference (parent) 2D coordinates: X \in [-1, 1]^2 33ed264d09SValeria Barra // 34ed264d09SValeria Barra // Global 3D physical coordinates given by the mesh: xx \in [-R, R]^3 35ed264d09SValeria Barra // with R radius of the sphere 36ed264d09SValeria Barra // 37ed264d09SValeria Barra // Local 3D physical coordinates on the 2D manifold: x \in [-l, l]^3 38ed264d09SValeria Barra // with l half edge of the cube inscribed in the sphere 39ed264d09SValeria Barra // 40ed264d09SValeria Barra // Change of coordinates matrix computed by the library: 41ed264d09SValeria Barra // (physical 3D coords relative to reference 2D coords) 42ed264d09SValeria Barra // dxx_j/dX_i (indicial notation) [3 * 2] 43ed264d09SValeria Barra // 44ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to xx (phyisical 3D): 45ed264d09SValeria Barra // dx_i/dxx_j (indicial notation) [3 * 3] 46ed264d09SValeria Barra // 47ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to X (reference 2D): 48ed264d09SValeria Barra // (by chain rule) 49ed264d09SValeria Barra // dx_i/dX_j [3 * 2] = dx_i/dxx_k [3 * 3] * dxx_k/dX_j [3 * 2] 50ed264d09SValeria Barra // 51*9b072555Sjeremylt // mod_J is given by the magnitude of the cross product of the columns of dx_i/dX_j 52ed264d09SValeria Barra // 53*9b072555Sjeremylt // The quadrature data is stored in the array q_data. 54ed264d09SValeria Barra // 55ed264d09SValeria Barra // We require the determinant of the Jacobian to properly compute integrals of 56ed264d09SValeria Barra // the form: int( u v ) 57ed264d09SValeria Barra // 58*9b072555Sjeremylt // Qdata: mod_J * w 59ed264d09SValeria Barra // 60e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 61ed264d09SValeria Barra CEED_QFUNCTION(SetupMassGeo)(void *ctx, const CeedInt Q, 62ed264d09SValeria Barra const CeedScalar *const *in, 63ed264d09SValeria Barra CeedScalar *const *out) { 64ed264d09SValeria Barra // Inputs 65ed264d09SValeria Barra const CeedScalar *X = in[0], *J = in[1], *w = in[2]; 66ed264d09SValeria Barra // Outputs 67*9b072555Sjeremylt CeedScalar *q_data = out[0]; 68ed264d09SValeria Barra 69ed264d09SValeria Barra // Quadrature Point Loop 70ed264d09SValeria Barra CeedPragmaSIMD 71ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 72ed264d09SValeria Barra // Read global Cartesian coordinates 73ed264d09SValeria Barra const CeedScalar xx[3] = {X[i+0*Q], 74ed264d09SValeria Barra X[i+1*Q], 75ed264d09SValeria Barra X[i+2*Q] 76ed264d09SValeria Barra }; 77ed264d09SValeria Barra 78ed264d09SValeria Barra // Read dxxdX Jacobian entries, stored as 79ed264d09SValeria Barra // 0 3 80ed264d09SValeria Barra // 1 4 81ed264d09SValeria Barra // 2 5 82ed264d09SValeria Barra const CeedScalar dxxdX[3][2] = {{J[i+Q*0], 83ed264d09SValeria Barra J[i+Q*3]}, 84ed264d09SValeria Barra {J[i+Q*1], 85ed264d09SValeria Barra J[i+Q*4]}, 86ed264d09SValeria Barra {J[i+Q*2], 87ed264d09SValeria Barra J[i+Q*5]} 88ed264d09SValeria Barra }; 89ed264d09SValeria Barra 90ed264d09SValeria Barra // Setup 91ed264d09SValeria Barra // x = xx (xx^T xx)^{-1/2} 92ed264d09SValeria Barra // dx/dxx = I (xx^T xx)^{-1/2} - xx xx^T (xx^T xx)^{-3/2} 93*9b072555Sjeremylt const CeedScalar mod_xx_sq = xx[0]*xx[0]+xx[1]*xx[1]+xx[2]*xx[2]; 94*9b072555Sjeremylt CeedScalar xx_sq[3][3]; 95ed264d09SValeria Barra for (int j=0; j<3; j++) 96ed264d09SValeria Barra for (int k=0; k<3; k++) 97*9b072555Sjeremylt xx_sq[j][k] = xx[j]*xx[k] / (sqrt(mod_xx_sq) * mod_xx_sq); 98ed264d09SValeria Barra 99*9b072555Sjeremylt const CeedScalar dxdxx[3][3] = {{1./sqrt(mod_xx_sq) - xx_sq[0][0], 100*9b072555Sjeremylt -xx_sq[0][1], 101*9b072555Sjeremylt -xx_sq[0][2]}, 102*9b072555Sjeremylt {-xx_sq[1][0], 103*9b072555Sjeremylt 1./sqrt(mod_xx_sq) - xx_sq[1][1], 104*9b072555Sjeremylt -xx_sq[1][2]}, 105*9b072555Sjeremylt {-xx_sq[2][0], 106*9b072555Sjeremylt -xx_sq[2][1], 107*9b072555Sjeremylt 1./sqrt(mod_xx_sq) - xx_sq[2][2]} 108ed264d09SValeria Barra }; 109ed264d09SValeria Barra 110ed264d09SValeria Barra CeedScalar dxdX[3][2]; 111ed264d09SValeria Barra for (int j=0; j<3; j++) 112ed264d09SValeria Barra for (int k=0; k<2; k++) { 113ed264d09SValeria Barra dxdX[j][k] = 0; 114ed264d09SValeria Barra for (int l=0; l<3; l++) 115ed264d09SValeria Barra dxdX[j][k] += dxdxx[j][l]*dxxdX[l][k]; 116ed264d09SValeria Barra } 117ed264d09SValeria Barra 118ed264d09SValeria Barra // J is given by the cross product of the columns of dxdX 119ed264d09SValeria Barra const CeedScalar J[3] = {dxdX[1][0]*dxdX[2][1] - dxdX[2][0]*dxdX[1][1], 120ed264d09SValeria Barra dxdX[2][0]*dxdX[0][1] - dxdX[0][0]*dxdX[2][1], 121ed264d09SValeria Barra dxdX[0][0]*dxdX[1][1] - dxdX[1][0]*dxdX[0][1] 122ed264d09SValeria Barra }; 123ed264d09SValeria Barra 124ed264d09SValeria Barra // Use the magnitude of J as our detJ (volume scaling factor) 125*9b072555Sjeremylt const CeedScalar mod_J = sqrt(J[0]*J[0]+J[1]*J[1]+J[2]*J[2]); 126ed264d09SValeria Barra 127*9b072555Sjeremylt // Interp-to-Interp q_data 128*9b072555Sjeremylt q_data[i+Q*0] = mod_J * w[i]; 129ed264d09SValeria Barra } // End of Quadrature Point Loop 130ed264d09SValeria Barra 131ed264d09SValeria Barra return 0; 132ed264d09SValeria Barra } 133ed264d09SValeria Barra 134e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 135ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem 136ed264d09SValeria Barra // ----------------------------------------------------------------------------- 137ed264d09SValeria Barra CEED_QFUNCTION(SetupMassRhs)(void *ctx, const CeedInt Q, 138ed264d09SValeria Barra const CeedScalar *const *in, 139ed264d09SValeria Barra CeedScalar *const *out) { 140ed264d09SValeria Barra // Inputs 141*9b072555Sjeremylt const CeedScalar *X = in[0], *q_data = in[1]; 142ed264d09SValeria Barra // Outputs 143ed264d09SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 144ed264d09SValeria Barra 145ed264d09SValeria Barra // Context 146ed264d09SValeria Barra const CeedScalar *context = (const CeedScalar*)ctx; 147ed264d09SValeria Barra const CeedScalar R = context[0]; 148ed264d09SValeria Barra 149ed264d09SValeria Barra // Quadrature Point Loop 150ed264d09SValeria Barra CeedPragmaSIMD 151ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 152ed264d09SValeria Barra // Compute latitude 153ed264d09SValeria Barra const CeedScalar theta = asin(X[i+2*Q] / R); 154ed264d09SValeria Barra 155*9b072555Sjeremylt // Use absolute value of latitude for true solution 156ed264d09SValeria Barra true_soln[i] = fabs(theta); 157ed264d09SValeria Barra 158*9b072555Sjeremylt rhs[i] = q_data[i] * true_soln[i]; 159ed264d09SValeria Barra } // End of Quadrature Point Loop 160ed264d09SValeria Barra 161ed264d09SValeria Barra return 0; 162ed264d09SValeria Barra } 163ed264d09SValeria Barra 164e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 165ed264d09SValeria Barra // This QFunction applies the mass operator for a scalar field. 166ed264d09SValeria Barra // 167ed264d09SValeria Barra // Inputs: 168ed264d09SValeria Barra // u - Input vector at quadrature points 169*9b072555Sjeremylt // q_data - Geometric factors 170ed264d09SValeria Barra // 171ed264d09SValeria Barra // Output: 172ed264d09SValeria Barra // v - Output vector (test functions) at quadrature points 173ed264d09SValeria Barra // 174ed264d09SValeria Barra // ----------------------------------------------------------------------------- 175ed264d09SValeria Barra CEED_QFUNCTION(Mass)(void *ctx, const CeedInt Q, 176ed264d09SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 177ed264d09SValeria Barra // Inputs 178*9b072555Sjeremylt const CeedScalar *u = in[0], *q_data = in[1]; 179ed264d09SValeria Barra // Outputs 180ed264d09SValeria Barra CeedScalar *v = out[0]; 181ed264d09SValeria Barra 182ed264d09SValeria Barra // Quadrature Point Loop 183ed264d09SValeria Barra CeedPragmaSIMD 184ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) 185*9b072555Sjeremylt v[i] = q_data[i] * u[i]; 186ed264d09SValeria Barra 187ed264d09SValeria Barra return 0; 188ed264d09SValeria Barra } 189ed264d09SValeria Barra // ----------------------------------------------------------------------------- 190f6b55d2cSvaleriabarra 191f6b55d2cSvaleriabarra #endif // bp1sphere_h 192