Lines Matching refs:P
33 CeedInt dim, num_comp, num_nodes, P_1d, Q_1d, P, Q; in CeedBasisApplyCore_Magma() local
46 P = P_1d; in CeedBasisApplyCore_Magma()
49 P = Q_1d; in CeedBasisApplyCore_Magma()
92 CeedInt max_P_Q = CeedIntMax(P, Q); in CeedBasisApplyCore_Magma()
98 shared_mem += sizeof(CeedScalar) * num_t_col * (num_comp * (1 * P + 1 * Q)); in CeedBasisApplyCore_Magma()
99 shared_mem += sizeof(CeedScalar) * (P * Q); in CeedBasisApplyCore_Magma()
104 shared_mem += P * Q * sizeof(CeedScalar); // for sT in CeedBasisApplyCore_Magma()
106 shared_mem += num_t_col * (P * max_P_Q * sizeof(CeedScalar)); in CeedBasisApplyCore_Magma()
111 shared_mem += sizeof(CeedScalar) * (P * Q); // for sT in CeedBasisApplyCore_Magma()
113 shared_mem += sizeof(CeedScalar) * num_t_col * (CeedIntMax(P * P * max_P_Q, P * Q * Q)); in CeedBasisApplyCore_Magma()
169 CeedInt max_P_Q = CeedIntMax(P, Q); in CeedBasisApplyCore_Magma()
175 shared_mem += sizeof(CeedScalar) * num_t_col * (num_comp * (1 * P + 1 * Q)); in CeedBasisApplyCore_Magma()
176 shared_mem += sizeof(CeedScalar) * (P * Q); in CeedBasisApplyCore_Magma()
181 shared_mem += sizeof(CeedScalar) * 2 * P * Q; // for sTinterp and sTgrad in CeedBasisApplyCore_Magma()
183 shared_mem += sizeof(CeedScalar) * num_t_col * (P * max_P_Q); in CeedBasisApplyCore_Magma()
188 shared_mem += sizeof(CeedScalar) * 2 * P * Q; // for sTinterp and sTgrad in CeedBasisApplyCore_Magma()
190 … shared_mem += sizeof(CeedScalar) * num_t_col * CeedIntMax(P * P * P, (P * P * Q) + (P * Q * Q)); in CeedBasisApplyCore_Magma()
281 CeedInt num_comp, num_nodes, num_qpts, P, Q, N; in CeedBasisApplyNonTensorCore_Magma() local
292 P = num_nodes; in CeedBasisApplyNonTensorCore_Magma()
304 …if (P <= MAGMA_NONTENSOR_CUSTOM_KERNEL_MAX_P && Q <= MAGMA_NONTENSOR_CUSTOM_KERNEL_MAX_Q && (e_mod… in CeedBasisApplyNonTensorCore_Magma()
340 impl->NB_interp[iN] = nontensor_rtc_get_nb(arch, 'n', q_comp_interp, P, Q, n_array[iN]); in CeedBasisApplyNonTensorCore_Magma()
341 impl->NB_interp_t[iN] = nontensor_rtc_get_nb(arch, 't', q_comp_interp, P, Q, n_array[iN]); in CeedBasisApplyNonTensorCore_Magma()
342 impl->NB_deriv[iN] = nontensor_rtc_get_nb(arch, 'n', q_comp_deriv, P, Q, n_array[iN]); in CeedBasisApplyNonTensorCore_Magma()
343 impl->NB_deriv_t[iN] = nontensor_rtc_get_nb(arch, 't', q_comp_deriv, P, Q, n_array[iN]); in CeedBasisApplyNonTensorCore_Magma()
358 …"BASIS_Q_COMP_DERIV", q_comp_deriv, "BASIS_P", P, "BASIS_Q", Q, "BASIS_NB_INTERP_N", impl->NB_inte… in CeedBasisApplyNonTensorCore_Magma()
405 M = (t_mode == CEED_TRANSPOSE) ? P : Q, K = (t_mode == CEED_TRANSPOSE) ? Q : P; in CeedBasisApplyNonTensorCore_Magma()
407 if (P <= MAGMA_NONTENSOR_CUSTOM_KERNEL_MAX_P && Q <= MAGMA_NONTENSOR_CUSTOM_KERNEL_MAX_Q) { in CeedBasisApplyNonTensorCore_Magma()
427 CeedInt shared_mem_A = P * Q * sizeof(CeedScalar); in CeedBasisApplyNonTensorCore_Magma()
437 …gemm_nontensor(MagmaNoTrans, MagmaNoTrans, P, N, Q, 1.0, d_b + d * P * Q, P, d_u + d * N * Q, Q, b… in CeedBasisApplyNonTensorCore_Magma()
439 …magma_gemm_nontensor(MagmaTrans, MagmaNoTrans, Q, N, P, 1.0, d_b + d * P * Q, P, d_u, P, 0.0, d_v … in CeedBasisApplyNonTensorCore_Magma()