1*ed264d09SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at 2*ed264d09SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights 3*ed264d09SValeria Barra // reserved. See files LICENSE and NOTICE for details. 4*ed264d09SValeria Barra // 5*ed264d09SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software 6*ed264d09SValeria Barra // libraries and APIs for efficient high-order finite element and spectral 7*ed264d09SValeria Barra // element discretizations for exascale applications. For more information and 8*ed264d09SValeria Barra // source code availability see http://github.com/ceed. 9*ed264d09SValeria Barra // 10*ed264d09SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, 11*ed264d09SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office 12*ed264d09SValeria Barra // of Science and the National Nuclear Security Administration) responsible for 13*ed264d09SValeria Barra // the planning and preparation of a capable exascale ecosystem, including 14*ed264d09SValeria Barra // software, applications, hardware, advanced system engineering and early 15*ed264d09SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative. 16*ed264d09SValeria Barra 17*ed264d09SValeria Barra /// @file 18*ed264d09SValeria Barra /// libCEED QFunctions for mass operator example for a scalar field on the sphere using PETSc 19*ed264d09SValeria Barra 20*ed264d09SValeria Barra #ifndef __CUDACC__ 21*ed264d09SValeria Barra # include <math.h> 22*ed264d09SValeria Barra #endif 23*ed264d09SValeria Barra 24*ed264d09SValeria Barra // ***************************************************************************** 25*ed264d09SValeria Barra // This QFunction sets up the geometric factors required for integration and 26*ed264d09SValeria Barra // coordinate transformations when reference coordinates have a different 27*ed264d09SValeria Barra // dimension than the one of physical coordinates 28*ed264d09SValeria Barra // 29*ed264d09SValeria Barra // Reference (parent) 2D coordinates: X \in [-1, 1]^2 30*ed264d09SValeria Barra // 31*ed264d09SValeria Barra // Global 3D physical coordinates given by the mesh: xx \in [-R, R]^3 32*ed264d09SValeria Barra // with R radius of the sphere 33*ed264d09SValeria Barra // 34*ed264d09SValeria Barra // Local 3D physical coordinates on the 2D manifold: x \in [-l, l]^3 35*ed264d09SValeria Barra // with l half edge of the cube inscribed in the sphere 36*ed264d09SValeria Barra // 37*ed264d09SValeria Barra // Change of coordinates matrix computed by the library: 38*ed264d09SValeria Barra // (physical 3D coords relative to reference 2D coords) 39*ed264d09SValeria Barra // dxx_j/dX_i (indicial notation) [3 * 2] 40*ed264d09SValeria Barra // 41*ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to xx (phyisical 3D): 42*ed264d09SValeria Barra // dx_i/dxx_j (indicial notation) [3 * 3] 43*ed264d09SValeria Barra // 44*ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to X (reference 2D): 45*ed264d09SValeria Barra // (by chain rule) 46*ed264d09SValeria Barra // dx_i/dX_j [3 * 2] = dx_i/dxx_k [3 * 3] * dxx_k/dX_j [3 * 2] 47*ed264d09SValeria Barra // 48*ed264d09SValeria Barra // modJ is given by the magnitude of the cross product of the columns of dx_i/dX_j 49*ed264d09SValeria Barra // 50*ed264d09SValeria Barra // The quadrature data is stored in the array qdata. 51*ed264d09SValeria Barra // 52*ed264d09SValeria Barra // We require the determinant of the Jacobian to properly compute integrals of 53*ed264d09SValeria Barra // the form: int( u v ) 54*ed264d09SValeria Barra // 55*ed264d09SValeria Barra // Qdata: modJ * w 56*ed264d09SValeria Barra // 57*ed264d09SValeria Barra // ***************************************************************************** 58*ed264d09SValeria Barra 59*ed264d09SValeria Barra // ***************************************************************************** 60*ed264d09SValeria Barra CEED_QFUNCTION(SetupMassGeo)(void *ctx, const CeedInt Q, 61*ed264d09SValeria Barra const CeedScalar *const *in, 62*ed264d09SValeria Barra CeedScalar *const *out) { 63*ed264d09SValeria Barra // Inputs 64*ed264d09SValeria Barra const CeedScalar *X = in[0], *J = in[1], *w = in[2]; 65*ed264d09SValeria Barra // Outputs 66*ed264d09SValeria Barra CeedScalar *qdata = out[0]; 67*ed264d09SValeria Barra 68*ed264d09SValeria Barra // Quadrature Point Loop 69*ed264d09SValeria Barra CeedPragmaSIMD 70*ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 71*ed264d09SValeria Barra // Read global Cartesian coordinates 72*ed264d09SValeria Barra const CeedScalar xx[3] = {X[i+0*Q], 73*ed264d09SValeria Barra X[i+1*Q], 74*ed264d09SValeria Barra X[i+2*Q] 75*ed264d09SValeria Barra }; 76*ed264d09SValeria Barra 77*ed264d09SValeria Barra // Read dxxdX Jacobian entries, stored as 78*ed264d09SValeria Barra // 0 3 79*ed264d09SValeria Barra // 1 4 80*ed264d09SValeria Barra // 2 5 81*ed264d09SValeria Barra const CeedScalar dxxdX[3][2] = {{J[i+Q*0], 82*ed264d09SValeria Barra J[i+Q*3]}, 83*ed264d09SValeria Barra {J[i+Q*1], 84*ed264d09SValeria Barra J[i+Q*4]}, 85*ed264d09SValeria Barra {J[i+Q*2], 86*ed264d09SValeria Barra J[i+Q*5]} 87*ed264d09SValeria Barra }; 88*ed264d09SValeria Barra 89*ed264d09SValeria Barra // Setup 90*ed264d09SValeria Barra // x = xx (xx^T xx)^{-1/2} 91*ed264d09SValeria Barra // dx/dxx = I (xx^T xx)^{-1/2} - xx xx^T (xx^T xx)^{-3/2} 92*ed264d09SValeria Barra const CeedScalar modxxsq = xx[0]*xx[0]+xx[1]*xx[1]+xx[2]*xx[2]; 93*ed264d09SValeria Barra CeedScalar xxsq[3][3]; 94*ed264d09SValeria Barra for (int j=0; j<3; j++) 95*ed264d09SValeria Barra for (int k=0; k<3; k++) 96*ed264d09SValeria Barra xxsq[j][k] = xx[j]*xx[k] / (sqrt(modxxsq) * modxxsq); 97*ed264d09SValeria Barra 98*ed264d09SValeria Barra const CeedScalar dxdxx[3][3] = {{1./sqrt(modxxsq) - xxsq[0][0], 99*ed264d09SValeria Barra -xxsq[0][1], 100*ed264d09SValeria Barra -xxsq[0][2]}, 101*ed264d09SValeria Barra {-xxsq[1][0], 102*ed264d09SValeria Barra 1./sqrt(modxxsq) - xxsq[1][1], 103*ed264d09SValeria Barra -xxsq[1][2]}, 104*ed264d09SValeria Barra {-xxsq[2][0], 105*ed264d09SValeria Barra -xxsq[2][1], 106*ed264d09SValeria Barra 1./sqrt(modxxsq) - xxsq[2][2]} 107*ed264d09SValeria Barra }; 108*ed264d09SValeria Barra 109*ed264d09SValeria Barra CeedScalar dxdX[3][2]; 110*ed264d09SValeria Barra for (int j=0; j<3; j++) 111*ed264d09SValeria Barra for (int k=0; k<2; k++) { 112*ed264d09SValeria Barra dxdX[j][k] = 0; 113*ed264d09SValeria Barra for (int l=0; l<3; l++) 114*ed264d09SValeria Barra dxdX[j][k] += dxdxx[j][l]*dxxdX[l][k]; 115*ed264d09SValeria Barra } 116*ed264d09SValeria Barra 117*ed264d09SValeria Barra // J is given by the cross product of the columns of dxdX 118*ed264d09SValeria Barra const CeedScalar J[3] = {dxdX[1][0]*dxdX[2][1] - dxdX[2][0]*dxdX[1][1], 119*ed264d09SValeria Barra dxdX[2][0]*dxdX[0][1] - dxdX[0][0]*dxdX[2][1], 120*ed264d09SValeria Barra dxdX[0][0]*dxdX[1][1] - dxdX[1][0]*dxdX[0][1] 121*ed264d09SValeria Barra }; 122*ed264d09SValeria Barra 123*ed264d09SValeria Barra // Use the magnitude of J as our detJ (volume scaling factor) 124*ed264d09SValeria Barra const CeedScalar modJ = sqrt(J[0]*J[0]+J[1]*J[1]+J[2]*J[2]); 125*ed264d09SValeria Barra 126*ed264d09SValeria Barra // Interp-to-Interp qdata 127*ed264d09SValeria Barra qdata[i+Q*0] = modJ * w[i]; 128*ed264d09SValeria Barra } // End of Quadrature Point Loop 129*ed264d09SValeria Barra 130*ed264d09SValeria Barra return 0; 131*ed264d09SValeria Barra } 132*ed264d09SValeria Barra 133*ed264d09SValeria Barra // ***************************************************************************** 134*ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem 135*ed264d09SValeria Barra // ***************************************************************************** 136*ed264d09SValeria Barra 137*ed264d09SValeria Barra // ----------------------------------------------------------------------------- 138*ed264d09SValeria Barra CEED_QFUNCTION(SetupMassRhs)(void *ctx, const CeedInt Q, 139*ed264d09SValeria Barra const CeedScalar *const *in, 140*ed264d09SValeria Barra CeedScalar *const *out) { 141*ed264d09SValeria Barra // Inputs 142*ed264d09SValeria Barra const CeedScalar *X = in[0], *qdata = in[1]; 143*ed264d09SValeria Barra // Outputs 144*ed264d09SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 145*ed264d09SValeria Barra 146*ed264d09SValeria Barra // Context 147*ed264d09SValeria Barra const CeedScalar *context = (const CeedScalar*)ctx; 148*ed264d09SValeria Barra const CeedScalar R = context[0]; 149*ed264d09SValeria Barra 150*ed264d09SValeria Barra // Quadrature Point Loop 151*ed264d09SValeria Barra CeedPragmaSIMD 152*ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 153*ed264d09SValeria Barra // Compute latitude 154*ed264d09SValeria Barra const CeedScalar theta = asin(X[i+2*Q] / R); 155*ed264d09SValeria Barra 156*ed264d09SValeria Barra // Use absolute value of latitute for true solution 157*ed264d09SValeria Barra true_soln[i] = fabs(theta); 158*ed264d09SValeria Barra 159*ed264d09SValeria Barra rhs[i] = qdata[i] * true_soln[i]; 160*ed264d09SValeria Barra } // End of Quadrature Point Loop 161*ed264d09SValeria Barra 162*ed264d09SValeria Barra return 0; 163*ed264d09SValeria Barra } 164*ed264d09SValeria Barra 165*ed264d09SValeria Barra // ***************************************************************************** 166*ed264d09SValeria Barra // This QFunction applies the mass operator for a scalar field. 167*ed264d09SValeria Barra // 168*ed264d09SValeria Barra // Inputs: 169*ed264d09SValeria Barra // u - Input vector at quadrature points 170*ed264d09SValeria Barra // qdata - Geometric factors 171*ed264d09SValeria Barra // 172*ed264d09SValeria Barra // Output: 173*ed264d09SValeria Barra // v - Output vector (test functions) at quadrature points 174*ed264d09SValeria Barra // 175*ed264d09SValeria Barra // ***************************************************************************** 176*ed264d09SValeria Barra 177*ed264d09SValeria Barra // ----------------------------------------------------------------------------- 178*ed264d09SValeria Barra CEED_QFUNCTION(Mass)(void *ctx, const CeedInt Q, 179*ed264d09SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 180*ed264d09SValeria Barra // Inputs 181*ed264d09SValeria Barra const CeedScalar *u = in[0], *qdata = in[1]; 182*ed264d09SValeria Barra // Outputs 183*ed264d09SValeria Barra CeedScalar *v = out[0]; 184*ed264d09SValeria Barra 185*ed264d09SValeria Barra // Quadrature Point Loop 186*ed264d09SValeria Barra CeedPragmaSIMD 187*ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) 188*ed264d09SValeria Barra v[i] = qdata[i] * u[i]; 189*ed264d09SValeria Barra 190*ed264d09SValeria Barra return 0; 191*ed264d09SValeria Barra } 192*ed264d09SValeria Barra // ----------------------------------------------------------------------------- 193