Lines Matching refs:elems_per_block
260 const int elems_per_block = 1; in CeedBasisApplyNonTensorCore_Cuda() local
261 const int grid = CeedDivUpInt(num_elem, elems_per_block); in CeedBasisApplyNonTensorCore_Cuda()
289 …unKernelDim_Cuda(ceed, data->InterpTranspose, grid, block_size_x, 1, elems_per_block, interp_args)… in CeedBasisApplyNonTensorCore_Cuda()
291 …end(CeedRunKernelDim_Cuda(ceed, data->Interp, grid, block_size_x, 1, elems_per_block, interp_args)… in CeedBasisApplyNonTensorCore_Cuda()
299 …dRunKernelDim_Cuda(ceed, data->DerivTranspose, grid, block_size_x, 1, elems_per_block, grad_args)); in CeedBasisApplyNonTensorCore_Cuda()
301 …ckend(CeedRunKernelDim_Cuda(ceed, data->Deriv, grid, block_size_x, 1, elems_per_block, grad_args)); in CeedBasisApplyNonTensorCore_Cuda()
309 …edRunKernelDim_Cuda(ceed, data->DerivTranspose, grid, block_size_x, 1, elems_per_block, div_args)); in CeedBasisApplyNonTensorCore_Cuda()
311 …ackend(CeedRunKernelDim_Cuda(ceed, data->Deriv, grid, block_size_x, 1, elems_per_block, div_args)); in CeedBasisApplyNonTensorCore_Cuda()
319 …dRunKernelDim_Cuda(ceed, data->DerivTranspose, grid, block_size_x, 1, elems_per_block, curl_args)); in CeedBasisApplyNonTensorCore_Cuda()
321 …ckend(CeedRunKernelDim_Cuda(ceed, data->Deriv, grid, block_size_x, 1, elems_per_block, curl_args)); in CeedBasisApplyNonTensorCore_Cuda()
328 …CeedCallBackend(CeedRunKernelDim_Cuda(ceed, data->Weight, grid, num_qpts, 1, elems_per_block, weig… in CeedBasisApplyNonTensorCore_Cuda()