1*038a8942SZach Atkins /// @file 2*038a8942SZach Atkins /// Test gradient transpose in multiple dimensions at arbitrary points 3*038a8942SZach Atkins /// \test Test gradient transpose in multiple dimensions at arbitrary points 4*038a8942SZach Atkins #include <ceed.h> 5*038a8942SZach Atkins #include <math.h> 6*038a8942SZach Atkins #include <stdio.h> 7*038a8942SZach Atkins 8*038a8942SZach Atkins static CeedScalar Eval(CeedInt dim, const CeedScalar x[]) { 9*038a8942SZach Atkins CeedScalar result = tanh(x[0] + 0.1); 10*038a8942SZach Atkins if (dim > 1) result += atan(x[1] + 0.2); 11*038a8942SZach Atkins if (dim > 2) result += exp(-(x[2] + 0.3) * (x[2] + 0.3)); 12*038a8942SZach Atkins return result; 13*038a8942SZach Atkins } 14*038a8942SZach Atkins 15*038a8942SZach Atkins static CeedScalar GetTolerance(CeedScalarType scalar_type, int dim) { 16*038a8942SZach Atkins CeedScalar tol; 17*038a8942SZach Atkins if (scalar_type == CEED_SCALAR_FP32) { 18*038a8942SZach Atkins if (dim == 3) tol = 0.005; 19*038a8942SZach Atkins else tol = 1.e-4; 20*038a8942SZach Atkins } else { 21*038a8942SZach Atkins tol = 1.e-11; 22*038a8942SZach Atkins } 23*038a8942SZach Atkins return tol; 24*038a8942SZach Atkins } 25*038a8942SZach Atkins 26*038a8942SZach Atkins int main(int argc, char **argv) { 27*038a8942SZach Atkins Ceed ceed; 28*038a8942SZach Atkins 29*038a8942SZach Atkins CeedInit(argv[1], &ceed); 30*038a8942SZach Atkins 31*038a8942SZach Atkins for (CeedInt dim = 1; dim <= 3; dim++) { 32*038a8942SZach Atkins CeedVector x, x_nodes, x_points, u, u_points, v, ones; 33*038a8942SZach Atkins CeedBasis basis_x, basis_u; 34*038a8942SZach Atkins const CeedInt p = 9, q = 9, num_points = 4, x_dim = CeedIntPow(2, dim), p_dim = CeedIntPow(p, dim); 35*038a8942SZach Atkins CeedScalar sum_1 = 0, sum_2 = 0; 36*038a8942SZach Atkins 37*038a8942SZach Atkins CeedVectorCreate(ceed, x_dim * dim, &x); 38*038a8942SZach Atkins CeedVectorCreate(ceed, p_dim * dim, &x_nodes); 39*038a8942SZach Atkins CeedVectorCreate(ceed, num_points * dim, &x_points); 40*038a8942SZach Atkins CeedVectorCreate(ceed, p_dim, &u); 41*038a8942SZach Atkins CeedVectorCreate(ceed, num_points * dim, &u_points); 42*038a8942SZach Atkins CeedVectorCreate(ceed, p_dim, &v); 43*038a8942SZach Atkins CeedVectorCreate(ceed, num_points * dim, &ones); 44*038a8942SZach Atkins 45*038a8942SZach Atkins CeedVectorSetValue(ones, 1); 46*038a8942SZach Atkins CeedVectorSetValue(v, 0); 47*038a8942SZach Atkins 48*038a8942SZach Atkins // Get nodal coordinates 49*038a8942SZach Atkins CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, 2, p, CEED_GAUSS_LOBATTO, &basis_x); 50*038a8942SZach Atkins { 51*038a8942SZach Atkins CeedScalar x_array[x_dim * dim]; 52*038a8942SZach Atkins 53*038a8942SZach Atkins for (CeedInt d = 0; d < dim; d++) { 54*038a8942SZach Atkins for (CeedInt i = 0; i < x_dim; i++) x_array[d * x_dim + i] = (i % CeedIntPow(2, d + 1)) / CeedIntPow(2, d) ? 1 : -1; 55*038a8942SZach Atkins } 56*038a8942SZach Atkins CeedVectorSetArray(x, CEED_MEM_HOST, CEED_COPY_VALUES, x_array); 57*038a8942SZach Atkins } 58*038a8942SZach Atkins CeedBasisApply(basis_x, 1, CEED_NOTRANSPOSE, CEED_EVAL_INTERP, x, x_nodes); 59*038a8942SZach Atkins 60*038a8942SZach Atkins // Set values of u at nodes 61*038a8942SZach Atkins { 62*038a8942SZach Atkins const CeedScalar *x_array; 63*038a8942SZach Atkins CeedScalar u_array[p_dim]; 64*038a8942SZach Atkins 65*038a8942SZach Atkins CeedVectorGetArrayRead(x_nodes, CEED_MEM_HOST, &x_array); 66*038a8942SZach Atkins for (CeedInt i = 0; i < p_dim; i++) { 67*038a8942SZach Atkins CeedScalar coord[dim]; 68*038a8942SZach Atkins 69*038a8942SZach Atkins for (CeedInt d = 0; d < dim; d++) coord[d] = x_array[d * p_dim + i]; 70*038a8942SZach Atkins u_array[i] = Eval(dim, coord); 71*038a8942SZach Atkins } 72*038a8942SZach Atkins CeedVectorRestoreArrayRead(x_nodes, &x_array); 73*038a8942SZach Atkins CeedVectorSetArray(u, CEED_MEM_HOST, CEED_COPY_VALUES, (CeedScalar *)&u_array); 74*038a8942SZach Atkins } 75*038a8942SZach Atkins 76*038a8942SZach Atkins // Interpolate to arbitrary points 77*038a8942SZach Atkins CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, p, q, CEED_GAUSS, &basis_u); 78*038a8942SZach Atkins { 79*038a8942SZach Atkins CeedScalar x_array[12] = {-0.33, -0.65, 0.16, 0.99, -0.65, 0.16, 0.99, -0.33, 0.16, 0.99, -0.33, -0.65}; 80*038a8942SZach Atkins 81*038a8942SZach Atkins CeedVectorSetArray(x_points, CEED_MEM_HOST, CEED_COPY_VALUES, x_array); 82*038a8942SZach Atkins } 83*038a8942SZach Atkins 84*038a8942SZach Atkins // Calculate G u at arbitrary points, G' * 1 at dofs 85*038a8942SZach Atkins CeedBasisApplyAtPoints(basis_u, num_points, CEED_NOTRANSPOSE, CEED_EVAL_GRAD, x_points, u, u_points); 86*038a8942SZach Atkins CeedBasisApplyAtPoints(basis_u, num_points, CEED_TRANSPOSE, CEED_EVAL_GRAD, x_points, ones, v); 87*038a8942SZach Atkins { 88*038a8942SZach Atkins const CeedScalar *u_array, *v_array, *u_points_array; 89*038a8942SZach Atkins 90*038a8942SZach Atkins CeedVectorGetArrayRead(u, CEED_MEM_HOST, &u_array); 91*038a8942SZach Atkins CeedVectorGetArrayRead(v, CEED_MEM_HOST, &v_array); 92*038a8942SZach Atkins CeedVectorGetArrayRead(u_points, CEED_MEM_HOST, &u_points_array); 93*038a8942SZach Atkins for (CeedInt i = 0; i < p_dim; i++) sum_1 += v_array[i] * u_array[i]; 94*038a8942SZach Atkins for (CeedInt i = 0; i < num_points * dim; i++) sum_2 += u_points_array[i]; 95*038a8942SZach Atkins CeedVectorRestoreArrayRead(u, &u_array); 96*038a8942SZach Atkins CeedVectorRestoreArrayRead(v, &v_array); 97*038a8942SZach Atkins CeedVectorRestoreArrayRead(u_points, &u_points_array); 98*038a8942SZach Atkins } 99*038a8942SZach Atkins CeedScalar tol = GetTolerance(CEED_SCALAR_TYPE, dim); 100*038a8942SZach Atkins if (fabs(sum_1 - sum_2) > tol) printf("[%" CeedInt_FMT "] %f != %f\n", dim, sum_1, sum_2); 101*038a8942SZach Atkins 102*038a8942SZach Atkins CeedVectorDestroy(&x); 103*038a8942SZach Atkins CeedVectorDestroy(&x_nodes); 104*038a8942SZach Atkins CeedVectorDestroy(&x_points); 105*038a8942SZach Atkins CeedVectorDestroy(&u); 106*038a8942SZach Atkins CeedVectorDestroy(&u_points); 107*038a8942SZach Atkins CeedVectorDestroy(&ones); 108*038a8942SZach Atkins CeedVectorDestroy(&v); 109*038a8942SZach Atkins CeedBasisDestroy(&basis_x); 110*038a8942SZach Atkins CeedBasisDestroy(&basis_u); 111*038a8942SZach Atkins } 112*038a8942SZach Atkins CeedDestroy(&ceed); 113*038a8942SZach Atkins return 0; 114*038a8942SZach Atkins } 115