1*6e15d496SJeremy L Thompson /// @file 2*6e15d496SJeremy L Thompson /// Test FLOP estimation for composite mass matrix operator 3*6e15d496SJeremy L Thompson /// \test Test FLOP estimation for composite mass matrix operator 4*6e15d496SJeremy L Thompson #include <ceed.h> 5*6e15d496SJeremy L Thompson #include <stdlib.h> 6*6e15d496SJeremy L Thompson #include <math.h> 7*6e15d496SJeremy L Thompson #include "t320-basis.h" 8*6e15d496SJeremy L Thompson 9*6e15d496SJeremy L Thompson /* The mesh comprises of two rows of 3 quadralaterals followed by one row 10*6e15d496SJeremy L Thompson of 6 triangles: 11*6e15d496SJeremy L Thompson _ _ _ 12*6e15d496SJeremy L Thompson |_|_|_| 13*6e15d496SJeremy L Thompson |_|_|_| 14*6e15d496SJeremy L Thompson |/|/|/| 15*6e15d496SJeremy L Thompson 16*6e15d496SJeremy L Thompson */ 17*6e15d496SJeremy L Thompson 18*6e15d496SJeremy L Thompson int main(int argc, char **argv) { 19*6e15d496SJeremy L Thompson Ceed ceed; 20*6e15d496SJeremy L Thompson CeedInt flop_estimate; 21*6e15d496SJeremy L Thompson CeedElemRestriction elem_restr_x_tet, elem_restr_u_tet, 22*6e15d496SJeremy L Thompson elem_restr_qd_i_tet, 23*6e15d496SJeremy L Thompson elem_restr_x_hex, elem_restr_u_hex, 24*6e15d496SJeremy L Thompson elem_restr_qd_i_hex; 25*6e15d496SJeremy L Thompson CeedBasis basis_x_tet, basis_u_tet, 26*6e15d496SJeremy L Thompson basis_x_hex, basis_u_hex; 27*6e15d496SJeremy L Thompson CeedQFunction qf_mass; 28*6e15d496SJeremy L Thompson CeedOperator op_mass_tet, op_mass_hex, op_mass; 29*6e15d496SJeremy L Thompson CeedVector q_data_tet, q_data_hex; 30*6e15d496SJeremy L Thompson CeedInt num_elem_tet = 6, P_tet = 6, Q_tet = 4, 31*6e15d496SJeremy L Thompson num_elem_hex = 6, P_hex = 3, Q_hex = 4, dim = 2; 32*6e15d496SJeremy L Thompson CeedInt n_x = 3, n_y = 3, 33*6e15d496SJeremy L Thompson n_x_tet = 3, n_y_tet = 1, n_x_hex = 3; 34*6e15d496SJeremy L Thompson CeedInt row, col, offset; 35*6e15d496SJeremy L Thompson CeedInt num_dofs = (n_x*2+1)*(n_y*2+1), 36*6e15d496SJeremy L Thompson num_qpts_tet = num_elem_tet*Q_tet, 37*6e15d496SJeremy L Thompson num_qpts_hex = num_elem_hex*Q_hex*Q_hex; 38*6e15d496SJeremy L Thompson CeedInt ind_x_tet[num_elem_tet*P_tet], 39*6e15d496SJeremy L Thompson ind_x_hex[num_elem_hex*P_hex*P_hex]; 40*6e15d496SJeremy L Thompson CeedScalar q_ref[dim*Q_tet], q_weight[Q_tet]; 41*6e15d496SJeremy L Thompson CeedScalar interp[P_tet*Q_tet], grad[dim*P_tet*Q_tet]; 42*6e15d496SJeremy L Thompson 43*6e15d496SJeremy L Thompson CeedInit(argv[1], &ceed); 44*6e15d496SJeremy L Thompson 45*6e15d496SJeremy L Thompson // Qdata Vectors 46*6e15d496SJeremy L Thompson CeedVectorCreate(ceed, num_qpts_tet, &q_data_tet); 47*6e15d496SJeremy L Thompson CeedVectorCreate(ceed, num_qpts_hex, &q_data_hex); 48*6e15d496SJeremy L Thompson 49*6e15d496SJeremy L Thompson // Set up Tet Elements 50*6e15d496SJeremy L Thompson for (CeedInt i=0; i<num_elem_tet/2; i++) { 51*6e15d496SJeremy L Thompson col = i % n_x_tet; 52*6e15d496SJeremy L Thompson row = i / n_x_tet; 53*6e15d496SJeremy L Thompson offset = col*2 + row*(n_x_tet*2+1)*2; 54*6e15d496SJeremy L Thompson 55*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 0] = 2 + offset; 56*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 1] = 9 + offset; 57*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 2] = 16 + offset; 58*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 3] = 1 + offset; 59*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 4] = 8 + offset; 60*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 5] = 0 + offset; 61*6e15d496SJeremy L Thompson 62*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 6] = 14 + offset; 63*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 7] = 7 + offset; 64*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 8] = 0 + offset; 65*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 9] = 15 + offset; 66*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 10] = 8 + offset; 67*6e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 11] = 16 + offset; 68*6e15d496SJeremy L Thompson } 69*6e15d496SJeremy L Thompson 70*6e15d496SJeremy L Thompson // -- Restrictions 71*6e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_tet, P_tet, dim, num_dofs, 72*6e15d496SJeremy L Thompson dim*num_dofs, 73*6e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet, 74*6e15d496SJeremy L Thompson &elem_restr_x_tet); 75*6e15d496SJeremy L Thompson 76*6e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_tet, P_tet, 1, 1, num_dofs, 77*6e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet, 78*6e15d496SJeremy L Thompson &elem_restr_u_tet); 79*6e15d496SJeremy L Thompson CeedInt strides_qd_tet[3] = {1, Q_tet, Q_tet}; 80*6e15d496SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem_tet, Q_tet, 1, num_qpts_tet, 81*6e15d496SJeremy L Thompson strides_qd_tet, &elem_restr_qd_i_tet); 82*6e15d496SJeremy L Thompson 83*6e15d496SJeremy L Thompson // -- Bases 84*6e15d496SJeremy L Thompson buildmats(q_ref, q_weight, interp, grad); 85*6e15d496SJeremy L Thompson CeedBasisCreateH1(ceed, CEED_TOPOLOGY_TRIANGLE, dim, P_tet, Q_tet, interp, grad, 86*6e15d496SJeremy L Thompson q_ref, q_weight, &basis_x_tet); 87*6e15d496SJeremy L Thompson 88*6e15d496SJeremy L Thompson buildmats(q_ref, q_weight, interp, grad); 89*6e15d496SJeremy L Thompson CeedBasisCreateH1(ceed, CEED_TOPOLOGY_TRIANGLE, 1, P_tet, Q_tet, interp, grad, 90*6e15d496SJeremy L Thompson q_ref, q_weight, &basis_u_tet); 91*6e15d496SJeremy L Thompson 92*6e15d496SJeremy L Thompson // -- QFunction 93*6e15d496SJeremy L Thompson CeedQFunctionCreateInteriorByName(ceed, "MassApply", &qf_mass); 94*6e15d496SJeremy L Thompson 95*6e15d496SJeremy L Thompson // -- Operators 96*6e15d496SJeremy L Thompson // ---- Mass Tet 97*6e15d496SJeremy L Thompson CeedOperatorCreate(ceed, qf_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, 98*6e15d496SJeremy L Thompson &op_mass_tet); 99*6e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_tet, "u", elem_restr_u_tet, basis_u_tet, 100*6e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 101*6e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_tet, "qdata", elem_restr_qd_i_tet, 102*6e15d496SJeremy L Thompson CEED_BASIS_COLLOCATED, 103*6e15d496SJeremy L Thompson q_data_tet); 104*6e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_tet, "v", elem_restr_u_tet, basis_u_tet, 105*6e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 106*6e15d496SJeremy L Thompson 107*6e15d496SJeremy L Thompson // Set up Hex Elements 108*6e15d496SJeremy L Thompson for (CeedInt i=0; i<num_elem_hex; i++) { 109*6e15d496SJeremy L Thompson col = i % n_x_hex; 110*6e15d496SJeremy L Thompson row = i / n_x_hex; 111*6e15d496SJeremy L Thompson offset = (n_x_tet*2+1)*(n_y_tet*2)*(1+row) + col*2; 112*6e15d496SJeremy L Thompson for (CeedInt j=0; j<P_hex; j++) 113*6e15d496SJeremy L Thompson for (CeedInt k=0; k<P_hex; k++) 114*6e15d496SJeremy L Thompson ind_x_hex[P_hex*(P_hex*i+k)+j] = offset + k*(n_x_hex*2+1) + j; 115*6e15d496SJeremy L Thompson } 116*6e15d496SJeremy L Thompson 117*6e15d496SJeremy L Thompson // -- Restrictions 118*6e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_hex, P_hex*P_hex, dim, num_dofs, 119*6e15d496SJeremy L Thompson dim*num_dofs, 120*6e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex, 121*6e15d496SJeremy L Thompson &elem_restr_x_hex); 122*6e15d496SJeremy L Thompson 123*6e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_hex, P_hex*P_hex, 1, 1, num_dofs, 124*6e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex, 125*6e15d496SJeremy L Thompson &elem_restr_u_hex); 126*6e15d496SJeremy L Thompson CeedInt strides_qd_hex[3] = {1, Q_hex*Q_hex, Q_hex*Q_hex}; 127*6e15d496SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem_hex, Q_hex*Q_hex, 1, 128*6e15d496SJeremy L Thompson num_qpts_hex, 129*6e15d496SJeremy L Thompson strides_qd_hex, &elem_restr_qd_i_hex); 130*6e15d496SJeremy L Thompson 131*6e15d496SJeremy L Thompson // -- Bases 132*6e15d496SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, P_hex, Q_hex, CEED_GAUSS, 133*6e15d496SJeremy L Thompson &basis_x_hex); 134*6e15d496SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, P_hex, Q_hex, CEED_GAUSS, 135*6e15d496SJeremy L Thompson &basis_u_hex); 136*6e15d496SJeremy L Thompson 137*6e15d496SJeremy L Thompson // -- Operators 138*6e15d496SJeremy L Thompson CeedOperatorCreate(ceed, qf_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, 139*6e15d496SJeremy L Thompson &op_mass_hex); 140*6e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_hex, "u", elem_restr_u_hex, basis_u_hex, 141*6e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 142*6e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_hex, "qdata", elem_restr_qd_i_hex, 143*6e15d496SJeremy L Thompson CEED_BASIS_COLLOCATED, 144*6e15d496SJeremy L Thompson q_data_hex); 145*6e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_hex, "v", elem_restr_u_hex, basis_u_hex, 146*6e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 147*6e15d496SJeremy L Thompson 148*6e15d496SJeremy L Thompson // Set up Composite Operator 149*6e15d496SJeremy L Thompson // -- Create 150*6e15d496SJeremy L Thompson CeedCompositeOperatorCreate(ceed, &op_mass); 151*6e15d496SJeremy L Thompson // -- Add SubOperators 152*6e15d496SJeremy L Thompson CeedCompositeOperatorAddSub(op_mass, op_mass_tet); 153*6e15d496SJeremy L Thompson CeedCompositeOperatorAddSub(op_mass, op_mass_hex); 154*6e15d496SJeremy L Thompson 155*6e15d496SJeremy L Thompson // Estimate FLOPs 156*6e15d496SJeremy L Thompson CeedQFunctionSetUserFlopsEstimate(qf_mass, 1); 157*6e15d496SJeremy L Thompson CeedOperatorGetFlopsEstimate(op_mass, &flop_estimate); 158*6e15d496SJeremy L Thompson 159*6e15d496SJeremy L Thompson // Check output 160*6e15d496SJeremy L Thompson if (flop_estimate != 3042) 161*6e15d496SJeremy L Thompson // LCOV_EXCL_START 162*6e15d496SJeremy L Thompson printf("Incorrect FLOP estimate computed, %d != 3042\n", flop_estimate); 163*6e15d496SJeremy L Thompson // LOCV_EXCL_STOP 164*6e15d496SJeremy L Thompson 165*6e15d496SJeremy L Thompson // Cleanup 166*6e15d496SJeremy L Thompson CeedQFunctionDestroy(&qf_mass); 167*6e15d496SJeremy L Thompson CeedOperatorDestroy(&op_mass_tet); 168*6e15d496SJeremy L Thompson CeedOperatorDestroy(&op_mass_hex); 169*6e15d496SJeremy L Thompson CeedOperatorDestroy(&op_mass); 170*6e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_u_tet); 171*6e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_x_tet); 172*6e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_i_tet); 173*6e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_u_hex); 174*6e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_x_hex); 175*6e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_i_hex); 176*6e15d496SJeremy L Thompson CeedBasisDestroy(&basis_u_tet); 177*6e15d496SJeremy L Thompson CeedBasisDestroy(&basis_x_tet); 178*6e15d496SJeremy L Thompson CeedBasisDestroy(&basis_u_hex); 179*6e15d496SJeremy L Thompson CeedBasisDestroy(&basis_x_hex); 180*6e15d496SJeremy L Thompson CeedVectorDestroy(&q_data_tet); 181*6e15d496SJeremy L Thompson CeedVectorDestroy(&q_data_hex); 182*6e15d496SJeremy L Thompson CeedDestroy(&ceed); 183*6e15d496SJeremy L Thompson return 0; 184*6e15d496SJeremy L Thompson } 185