1cb32e2e7SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at 2cb32e2e7SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights 3cb32e2e7SValeria Barra // reserved. See files LICENSE and NOTICE for details. 4cb32e2e7SValeria Barra // 5cb32e2e7SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software 6cb32e2e7SValeria Barra // libraries and APIs for efficient high-order finite element and spectral 7cb32e2e7SValeria Barra // element discretizations for exascale applications. For more information and 8cb32e2e7SValeria Barra // source code availability see http://github.com/ceed. 9cb32e2e7SValeria Barra // 10cb32e2e7SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, 11cb32e2e7SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office 12cb32e2e7SValeria Barra // of Science and the National Nuclear Security Administration) responsible for 13cb32e2e7SValeria Barra // the planning and preparation of a capable exascale ecosystem, including 14cb32e2e7SValeria Barra // software, applications, hardware, advanced system engineering and early 15cb32e2e7SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative. 16cb32e2e7SValeria Barra 17cb32e2e7SValeria Barra /// @file 18cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc 19cb32e2e7SValeria Barra 20f6b55d2cSvaleriabarra #ifndef bp4_h 21f6b55d2cSvaleriabarra #define bp4_h 22f6b55d2cSvaleriabarra 23f6b55d2cSvaleriabarra #ifndef __CUDACC__ 24f6b55d2cSvaleriabarra # include <math.h> 25f6b55d2cSvaleriabarra #endif 26f6b55d2cSvaleriabarra 27e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 2813921685Svaleriabarra // This QFunction sets up the rhs and true solution for the problem 29cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 30cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffRhs3)(void *ctx, CeedInt Q, 31cb32e2e7SValeria Barra const CeedScalar *const *in, 32cb32e2e7SValeria Barra CeedScalar *const *out) { 33cb32e2e7SValeria Barra #ifndef M_PI 34cb32e2e7SValeria Barra # define M_PI 3.14159265358979323846 35cb32e2e7SValeria Barra #endif 36e83e87a5Sjeremylt const CeedScalar *x = in[0], *w = in[1]; 37cb32e2e7SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 38cb32e2e7SValeria Barra 39cb32e2e7SValeria Barra // Quadrature Point Loop 40cb32e2e7SValeria Barra CeedPragmaSIMD 41cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 42cb32e2e7SValeria Barra const CeedScalar c[3] = { 0, 1., 2. }; 43cb32e2e7SValeria Barra const CeedScalar k[3] = { 1., 2., 3. }; 44cb32e2e7SValeria Barra 45cb32e2e7SValeria Barra // Component 1 46cb32e2e7SValeria Barra true_soln[i+0*Q] = sin(M_PI*(c[0] + k[0]*x[i+Q*0])) * 47cb32e2e7SValeria Barra sin(M_PI*(c[1] + k[1]*x[i+Q*1])) * 48cb32e2e7SValeria Barra sin(M_PI*(c[2] + k[2]*x[i+Q*2])); 49cb32e2e7SValeria Barra // Component 2 5082311801Sjeremylt true_soln[i+1*Q] = 2 * true_soln[i+0*Q]; 51cb32e2e7SValeria Barra // Component 3 5282311801Sjeremylt true_soln[i+2*Q] = 3 * true_soln[i+0*Q]; 53cb32e2e7SValeria Barra 54cb32e2e7SValeria Barra // Component 1 55e83e87a5Sjeremylt rhs[i+0*Q] = w[i+Q*6] * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) * 56cb32e2e7SValeria Barra true_soln[i+0*Q]; 57cb32e2e7SValeria Barra // Component 2 5882311801Sjeremylt rhs[i+1*Q] = 2 * rhs[i+0*Q]; 59cb32e2e7SValeria Barra // Component 3 6082311801Sjeremylt rhs[i+2*Q] = 3 * rhs[i+0*Q]; 61cb32e2e7SValeria Barra } // End of Quadrature Point Loop 62cb32e2e7SValeria Barra 63cb32e2e7SValeria Barra return 0; 64cb32e2e7SValeria Barra } 65cb32e2e7SValeria Barra 66e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 67ed264d09SValeria Barra // This QFunction applies the diffusion operator for a vector field of 3 components. 68ed264d09SValeria Barra // 69ed264d09SValeria Barra // Inputs: 70ed264d09SValeria Barra // ug - Input vector Jacobian at quadrature points 71*9b072555Sjeremylt // q_data - Geometric factors 72ed264d09SValeria Barra // 73ed264d09SValeria Barra // Output: 74ed264d09SValeria Barra // vJ - Output vector (test functions) Jacobian at quadrature points 75ed264d09SValeria Barra // 76cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 77cb32e2e7SValeria Barra CEED_QFUNCTION(Diff3)(void *ctx, CeedInt Q, 78cb32e2e7SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 79cb32e2e7SValeria Barra const CeedScalar *ug = in[0], *qd = in[1]; 80cb32e2e7SValeria Barra CeedScalar *vg = out[0]; 81cb32e2e7SValeria Barra 82cb32e2e7SValeria Barra // Quadrature Point Loop 83cb32e2e7SValeria Barra CeedPragmaSIMD 84cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 85cb32e2e7SValeria Barra // Read spatial derivatives of u components 86cb32e2e7SValeria Barra const CeedScalar uJ[3][3] = {{ug[i+(0+0*3)*Q], 87cb32e2e7SValeria Barra ug[i+(0+1*3)*Q], 88cb32e2e7SValeria Barra ug[i+(0+2*3)*Q]}, 89cb32e2e7SValeria Barra {ug[i+(1+0*3)*Q], 90cb32e2e7SValeria Barra ug[i+(1+1*3)*Q], 91cb32e2e7SValeria Barra ug[i+(1+2*3)*Q]}, 92cb32e2e7SValeria Barra {ug[i+(2+0*3)*Q], 93cb32e2e7SValeria Barra ug[i+(2+1*3)*Q], 94cb32e2e7SValeria Barra ug[i+(2+2*3)*Q]} 95cb32e2e7SValeria Barra }; 96*9b072555Sjeremylt // Read q_data (dXdxdXdx_T symmetric matrix) 97*9b072555Sjeremylt const CeedScalar dXdxdXdx_T[3][3] = {{qd[i+0*Q], 98cb32e2e7SValeria Barra qd[i+1*Q], 99cb32e2e7SValeria Barra qd[i+2*Q]}, 100cb32e2e7SValeria Barra {qd[i+1*Q], 101cb32e2e7SValeria Barra qd[i+3*Q], 102cb32e2e7SValeria Barra qd[i+4*Q]}, 103cb32e2e7SValeria Barra {qd[i+2*Q], 104cb32e2e7SValeria Barra qd[i+4*Q], 105cb32e2e7SValeria Barra qd[i+5*Q]} 106cb32e2e7SValeria Barra }; 107cb32e2e7SValeria Barra 108cb32e2e7SValeria Barra for (int k=0; k<3; k++) // k = component 109cb32e2e7SValeria Barra for (int j=0; j<3; j++) // j = direction of vg 110*9b072555Sjeremylt vg[i+(k+j*3)*Q] = (uJ[k][0] * dXdxdXdx_T[0][j] + 111*9b072555Sjeremylt uJ[k][1] * dXdxdXdx_T[1][j] + 112*9b072555Sjeremylt uJ[k][2] * dXdxdXdx_T[2][j]); 113cb32e2e7SValeria Barra } // End of Quadrature Point Loop 114cb32e2e7SValeria Barra 115cb32e2e7SValeria Barra return 0; 116cb32e2e7SValeria Barra } 117cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 118f6b55d2cSvaleriabarra 119f6b55d2cSvaleriabarra #endif // bp4_h 120