1*437c7c90SJeremy L Thompson /// @file 2*437c7c90SJeremy L Thompson /// Test assembly of operator diagonal for operator with multiple active bases 3*437c7c90SJeremy L Thompson /// \test Test assembly of operator diagonal for operator with multiple active bases 4*437c7c90SJeremy L Thompson #include "t539-operator.h" 5*437c7c90SJeremy L Thompson 6*437c7c90SJeremy L Thompson #include <ceed.h> 7*437c7c90SJeremy L Thompson #include <math.h> 8*437c7c90SJeremy L Thompson #include <stdlib.h> 9*437c7c90SJeremy L Thompson 10*437c7c90SJeremy L Thompson int main(int argc, char **argv) { 11*437c7c90SJeremy L Thompson Ceed ceed; 12*437c7c90SJeremy L Thompson CeedElemRestriction elem_restr_x, elem_restr_u_0, elem_restr_u_1, elem_restr_qd_mass, elem_restr_qd_diff; 13*437c7c90SJeremy L Thompson CeedBasis basis_x, basis_u_0, basis_u_1; 14*437c7c90SJeremy L Thompson CeedQFunction qf_setup_mass, qf_setup_diff, qf_apply; 15*437c7c90SJeremy L Thompson CeedOperator op_setup_mass, op_setup_diff, op_apply; 16*437c7c90SJeremy L Thompson CeedVector q_data_mass, q_data_diff, X, A, U, V; 17*437c7c90SJeremy L Thompson CeedInt num_elem = 6, P_0 = 2, P_1 = 3, Q = 4, dim = 2, num_comp_0 = 2, num_comp_1 = 1; 18*437c7c90SJeremy L Thompson CeedInt nx = 3, ny = 2; 19*437c7c90SJeremy L Thompson CeedInt num_dofs_0 = (nx * (P_0 - 1) + 1) * (ny * (P_0 - 1) + 1), num_dofs_1 = (nx * (P_1 - 1) + 1) * (ny * (P_1 - 1) + 1); 20*437c7c90SJeremy L Thompson CeedInt num_qpts = num_elem * Q * Q; 21*437c7c90SJeremy L Thompson CeedInt ind_u_0[num_elem * P_0 * P_0], ind_u_1[num_elem * P_1 * P_1]; 22*437c7c90SJeremy L Thompson CeedScalar x[dim * num_dofs_0], assembled_true[num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1]; 23*437c7c90SJeremy L Thompson CeedScalar *u; 24*437c7c90SJeremy L Thompson const CeedScalar *a, *v; 25*437c7c90SJeremy L Thompson 26*437c7c90SJeremy L Thompson CeedInit(argv[1], &ceed); 27*437c7c90SJeremy L Thompson 28*437c7c90SJeremy L Thompson // DoF Coordinates 29*437c7c90SJeremy L Thompson for (CeedInt i = 0; i < nx * 2 + 1; i++) { 30*437c7c90SJeremy L Thompson for (CeedInt j = 0; j < ny * 2 + 1; j++) { 31*437c7c90SJeremy L Thompson x[i + j * (nx * 2 + 1) + 0 * num_dofs_0] = (CeedScalar)i / (2 * nx); 32*437c7c90SJeremy L Thompson x[i + j * (nx * 2 + 1) + 1 * num_dofs_0] = (CeedScalar)j / (2 * ny); 33*437c7c90SJeremy L Thompson } 34*437c7c90SJeremy L Thompson } 35*437c7c90SJeremy L Thompson CeedVectorCreate(ceed, dim * num_dofs_0, &X); 36*437c7c90SJeremy L Thompson CeedVectorSetArray(X, CEED_MEM_HOST, CEED_USE_POINTER, x); 37*437c7c90SJeremy L Thompson 38*437c7c90SJeremy L Thompson // Qdata Vectors 39*437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_qpts, &q_data_mass); 40*437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_qpts * dim * (dim + 1) / 2, &q_data_diff); 41*437c7c90SJeremy L Thompson 42*437c7c90SJeremy L Thompson // Element Setup 43*437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_elem; i++) { 44*437c7c90SJeremy L Thompson CeedInt col, row, offset; 45*437c7c90SJeremy L Thompson col = i % nx; 46*437c7c90SJeremy L Thompson row = i / nx; 47*437c7c90SJeremy L Thompson offset = col * (P_0 - 1) + row * (nx * (P_0 - 1) + 1) * (P_0 - 1); 48*437c7c90SJeremy L Thompson for (CeedInt j = 0; j < P_0; j++) { 49*437c7c90SJeremy L Thompson for (CeedInt k = 0; k < P_0; k++) ind_u_0[P_0 * (P_0 * i + k) + j] = offset + k * (nx * (P_0 - 1) + 1) + j; 50*437c7c90SJeremy L Thompson } 51*437c7c90SJeremy L Thompson offset = col * (P_1 - 1) + row * (nx * (P_1 - 1) + 1) * (P_1 - 1) + num_dofs_0 * num_comp_0; 52*437c7c90SJeremy L Thompson for (CeedInt j = 0; j < P_1; j++) { 53*437c7c90SJeremy L Thompson for (CeedInt k = 0; k < P_1; k++) ind_u_1[P_1 * (P_1 * i + k) + j] = offset + k * (nx * (P_1 - 1) + 1) + j; 54*437c7c90SJeremy L Thompson } 55*437c7c90SJeremy L Thompson } 56*437c7c90SJeremy L Thompson 57*437c7c90SJeremy L Thompson // Restrictions 58*437c7c90SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem, P_0 * P_0, dim, num_dofs_0, dim * num_dofs_0, CEED_MEM_HOST, CEED_USE_POINTER, ind_u_0, &elem_restr_x); 59*437c7c90SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem, P_0 * P_0, num_comp_0, num_dofs_0, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, CEED_MEM_HOST, 60*437c7c90SJeremy L Thompson CEED_USE_POINTER, ind_u_0, &elem_restr_u_0); 61*437c7c90SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem, P_1 * P_1, num_comp_1, num_dofs_1, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, CEED_MEM_HOST, 62*437c7c90SJeremy L Thompson CEED_USE_POINTER, ind_u_1, &elem_restr_u_1); 63*437c7c90SJeremy L Thompson CeedInt strides_qd_mass[3] = {1, Q * Q, Q * Q}; 64*437c7c90SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, Q * Q, 1, num_qpts, strides_qd_mass, &elem_restr_qd_mass); 65*437c7c90SJeremy L Thompson CeedInt strides_qd_diff[3] = {1, Q * Q, dim * (dim + 1) / 2 * Q * Q}; 66*437c7c90SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, Q * Q, dim * (dim + 1) / 2, dim * (dim + 1) / 2 * num_qpts, strides_qd_diff, &elem_restr_qd_diff); 67*437c7c90SJeremy L Thompson 68*437c7c90SJeremy L Thompson // Bases 69*437c7c90SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, P_0, Q, CEED_GAUSS, &basis_x); 70*437c7c90SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, num_comp_0, P_0, Q, CEED_GAUSS, &basis_u_0); 71*437c7c90SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, num_comp_1, P_1, Q, CEED_GAUSS, &basis_u_1); 72*437c7c90SJeremy L Thompson 73*437c7c90SJeremy L Thompson // QFunction - setup mass 74*437c7c90SJeremy L Thompson CeedQFunctionCreateInteriorByName(ceed, "Mass2DBuild", &qf_setup_mass); 75*437c7c90SJeremy L Thompson 76*437c7c90SJeremy L Thompson // Operator - setup mass 77*437c7c90SJeremy L Thompson CeedOperatorCreate(ceed, qf_setup_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_setup_mass); 78*437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_mass, "dx", elem_restr_x, basis_x, CEED_VECTOR_ACTIVE); 79*437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_mass, "weights", CEED_ELEMRESTRICTION_NONE, basis_x, CEED_VECTOR_NONE); 80*437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_mass, "qdata", elem_restr_qd_mass, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE); 81*437c7c90SJeremy L Thompson 82*437c7c90SJeremy L Thompson // QFunction - setup diffusion 83*437c7c90SJeremy L Thompson CeedQFunctionCreateInteriorByName(ceed, "Poisson2DBuild", &qf_setup_diff); 84*437c7c90SJeremy L Thompson 85*437c7c90SJeremy L Thompson // Operator - setup diffusion 86*437c7c90SJeremy L Thompson CeedOperatorCreate(ceed, qf_setup_diff, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_setup_diff); 87*437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "dx", elem_restr_x, basis_x, CEED_VECTOR_ACTIVE); 88*437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "weights", CEED_ELEMRESTRICTION_NONE, basis_x, CEED_VECTOR_NONE); 89*437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "qdata", elem_restr_qd_diff, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE); 90*437c7c90SJeremy L Thompson 91*437c7c90SJeremy L Thompson // Apply Setup Operators 92*437c7c90SJeremy L Thompson CeedOperatorApply(op_setup_mass, X, q_data_mass, CEED_REQUEST_IMMEDIATE); 93*437c7c90SJeremy L Thompson CeedOperatorApply(op_setup_diff, X, q_data_diff, CEED_REQUEST_IMMEDIATE); 94*437c7c90SJeremy L Thompson 95*437c7c90SJeremy L Thompson // QFunction - apply 96*437c7c90SJeremy L Thompson CeedQFunctionCreateInterior(ceed, 1, apply, apply_loc, &qf_apply); 97*437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "du_0", num_comp_0 * dim, CEED_EVAL_GRAD); 98*437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "mass qdata", 1, CEED_EVAL_NONE); 99*437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "diff qdata", dim * (dim + 1) / 2, CEED_EVAL_NONE); 100*437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "u_0", num_comp_0, CEED_EVAL_INTERP); 101*437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "u_1", num_comp_1, CEED_EVAL_INTERP); 102*437c7c90SJeremy L Thompson CeedQFunctionAddOutput(qf_apply, "v_0", num_comp_0, CEED_EVAL_INTERP); 103*437c7c90SJeremy L Thompson CeedQFunctionAddOutput(qf_apply, "v_1", num_comp_1, CEED_EVAL_INTERP); 104*437c7c90SJeremy L Thompson CeedQFunctionAddOutput(qf_apply, "dv_0", num_comp_0 * dim, CEED_EVAL_GRAD); 105*437c7c90SJeremy L Thompson 106*437c7c90SJeremy L Thompson // Operator - apply 107*437c7c90SJeremy L Thompson CeedOperatorCreate(ceed, qf_apply, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_apply); 108*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "du_0", elem_restr_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 109*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "mass qdata", elem_restr_qd_mass, CEED_BASIS_COLLOCATED, q_data_mass); 110*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "diff qdata", elem_restr_qd_diff, CEED_BASIS_COLLOCATED, q_data_diff); 111*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "u_0", elem_restr_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 112*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "u_1", elem_restr_u_1, basis_u_1, CEED_VECTOR_ACTIVE); 113*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "v_0", elem_restr_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 114*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "v_1", elem_restr_u_1, basis_u_1, CEED_VECTOR_ACTIVE); 115*437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "dv_0", elem_restr_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 116*437c7c90SJeremy L Thompson 117*437c7c90SJeremy L Thompson // Assemble diagonal 118*437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, &A); 119*437c7c90SJeremy L Thompson CeedOperatorLinearAssembleDiagonal(op_apply, A, CEED_REQUEST_IMMEDIATE); 120*437c7c90SJeremy L Thompson 121*437c7c90SJeremy L Thompson // Manually assemble diagonal 122*437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, &U); 123*437c7c90SJeremy L Thompson CeedVectorSetValue(U, 0.0); 124*437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, &V); 125*437c7c90SJeremy L Thompson for (int i = 0; i < num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1; i++) assembled_true[i] = 0.0; 126*437c7c90SJeremy L Thompson for (int i = 0; i < num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1; i++) { 127*437c7c90SJeremy L Thompson // Set input 128*437c7c90SJeremy L Thompson CeedVectorGetArray(U, CEED_MEM_HOST, &u); 129*437c7c90SJeremy L Thompson u[i] = 1.0; 130*437c7c90SJeremy L Thompson if (i) u[i - 1] = 0.0; 131*437c7c90SJeremy L Thompson CeedVectorRestoreArray(U, &u); 132*437c7c90SJeremy L Thompson 133*437c7c90SJeremy L Thompson // Compute diag entry for DoF i 134*437c7c90SJeremy L Thompson CeedOperatorApply(op_apply, U, V, CEED_REQUEST_IMMEDIATE); 135*437c7c90SJeremy L Thompson 136*437c7c90SJeremy L Thompson // Retrieve entry 137*437c7c90SJeremy L Thompson CeedVectorGetArrayRead(V, CEED_MEM_HOST, &v); 138*437c7c90SJeremy L Thompson assembled_true[i] = v[i]; 139*437c7c90SJeremy L Thompson CeedVectorRestoreArrayRead(V, &v); 140*437c7c90SJeremy L Thompson } 141*437c7c90SJeremy L Thompson 142*437c7c90SJeremy L Thompson // Check output 143*437c7c90SJeremy L Thompson CeedVectorGetArrayRead(A, CEED_MEM_HOST, &a); 144*437c7c90SJeremy L Thompson for (int i = 0; i < num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1; i++) { 145*437c7c90SJeremy L Thompson if (fabs(a[i] - assembled_true[i]) > 1000. * CEED_EPSILON) printf("[%" CeedInt_FMT "] Error in assembly: %f != %f\n", i, a[i], assembled_true[i]); 146*437c7c90SJeremy L Thompson } 147*437c7c90SJeremy L Thompson CeedVectorRestoreArrayRead(A, &a); 148*437c7c90SJeremy L Thompson 149*437c7c90SJeremy L Thompson // Cleanup 150*437c7c90SJeremy L Thompson CeedQFunctionDestroy(&qf_setup_mass); 151*437c7c90SJeremy L Thompson CeedQFunctionDestroy(&qf_setup_diff); 152*437c7c90SJeremy L Thompson CeedQFunctionDestroy(&qf_apply); 153*437c7c90SJeremy L Thompson CeedOperatorDestroy(&op_setup_mass); 154*437c7c90SJeremy L Thompson CeedOperatorDestroy(&op_setup_diff); 155*437c7c90SJeremy L Thompson CeedOperatorDestroy(&op_apply); 156*437c7c90SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_x); 157*437c7c90SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_u_0); 158*437c7c90SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_u_1); 159*437c7c90SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_mass); 160*437c7c90SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_diff); 161*437c7c90SJeremy L Thompson CeedBasisDestroy(&basis_x); 162*437c7c90SJeremy L Thompson CeedBasisDestroy(&basis_u_0); 163*437c7c90SJeremy L Thompson CeedBasisDestroy(&basis_u_1); 164*437c7c90SJeremy L Thompson CeedVectorDestroy(&q_data_mass); 165*437c7c90SJeremy L Thompson CeedVectorDestroy(&q_data_diff); 166*437c7c90SJeremy L Thompson CeedVectorDestroy(&X); 167*437c7c90SJeremy L Thompson CeedVectorDestroy(&A); 168*437c7c90SJeremy L Thompson CeedVectorDestroy(&U); 169*437c7c90SJeremy L Thompson CeedVectorDestroy(&V); 170*437c7c90SJeremy L Thompson CeedDestroy(&ceed); 171*437c7c90SJeremy L Thompson return 0; 172*437c7c90SJeremy L Thompson } 173