Home
last modified time | relevance | path

Searched refs:kernel (Results 1 – 18 of 18) sorted by relevance

/libCEED/backends/sycl-shared/
H A Dceed-sycl-shared.hpp22 sycl::kernel *interp_kernel;
23 sycl::kernel *interp_transpose_kernel;
24 sycl::kernel *grad_kernel;
25 sycl::kernel *grad_transpose_kernel;
26 sycl::kernel *weight_kernel;
H A Dceed-sycl-shared-basis.sycl.cpp64 …sycl::kernel *interp_kernel = (t_mode == CEED_TRANSPOSE) ? impl->interp_transpose_kernel : impl->i… in CeedBasisApplyTensor_Sycl_shared()
85 …sycl::kernel *grad_kernel = (t_mode == CEED_TRANSPOSE) ? impl->grad_transpose_kernel : impl->g… in CeedBasisApplyTensor_Sycl_shared()
/libCEED/backends/cuda/
H A Dceed-cuda-compile.h18 CEED_INTERN int CeedGetKernel_Cuda(Ceed ceed, CUmodule module, const char *name, CUfunction *kernel
20 CEED_INTERN int CeedRunKernel_Cuda(Ceed ceed, CUfunction kernel, int grid_size, int block_size, voi…
22 CEED_INTERN int CeedRunKernelAutoblockCuda(Ceed ceed, CUfunction kernel, size_t points, void **args…
24 CEED_INTERN int CeedRunKernelDim_Cuda(Ceed ceed, CUfunction kernel, int grid_size, int block_size_x…
26 CEED_INTERN int CeedRunKernelDimShared_Cuda(Ceed ceed, CUfunction kernel, CUstream stream, int grid…
28 CEED_INTERN int CeedTryRunKernelDimShared_Cuda(Ceed ceed, CUfunction kernel, CUstream stream, int g…
H A Dceed-cuda-compile.cpp433 int CeedGetKernel_Cuda(Ceed ceed, CUmodule module, const char *name, CUfunction *kernel) { in CeedGetKernel_Cuda() argument
434 CeedCallCuda(ceed, cuModuleGetFunction(kernel, module, name)); in CeedGetKernel_Cuda()
443 int CeedRunKernelAutoblockCuda(Ceed ceed, CUfunction kernel, size_t points, void **args) { in CeedRunKernelAutoblockCuda() argument
446 …CeedCallCuda(ceed, cuOccupancyMaxPotentialBlockSize(&min_grid_size, &max_block_size, kernel, NULL,… in CeedRunKernelAutoblockCuda()
447 …CeedCallBackend(CeedRunKernel_Cuda(ceed, kernel, CeedDivUpInt(points, max_block_size), max_block_s… in CeedRunKernelAutoblockCuda()
454 int CeedRunKernel_Cuda(Ceed ceed, CUfunction kernel, const int grid_size, const int block_size, voi… in CeedRunKernel_Cuda() argument
455 …CeedCallBackend(CeedRunKernelDimShared_Cuda(ceed, kernel, NULL, grid_size, block_size, 1, 1, 0, ar… in CeedRunKernel_Cuda()
462 int CeedRunKernelDim_Cuda(Ceed ceed, CUfunction kernel, const int grid_size, const int block_size_x… in CeedRunKernelDim_Cuda() argument
464 …CeedCallBackend(CeedRunKernelDimShared_Cuda(ceed, kernel, NULL, grid_size, block_size_x, block_siz… in CeedRunKernelDim_Cuda()
471 static int CeedRunKernelDimSharedCore_Cuda(Ceed ceed, CUfunction kernel, CUstream stream, const int… in CeedRunKernelDimSharedCore_Cuda() argument
[all …]
/libCEED/backends/hip/
H A Dceed-hip-compile.h18 …TERN int CeedGetKernel_Hip(Ceed ceed, hipModule_t module, const char *name, hipFunction_t *kernel);
20 CEED_INTERN int CeedRunKernel_Hip(Ceed ceed, hipFunction_t kernel, int grid_size, int block_size, v…
22 CEED_INTERN int CeedRunKernelDim_Hip(Ceed ceed, hipFunction_t kernel, int grid_size, int block_size…
25 CEED_INTERN int CeedRunKernelDimShared_Hip(Ceed ceed, hipFunction_t kernel, hipStream_t stream, int…
27 CEED_INTERN int CeedTryRunKernelDimShared_Hip(Ceed ceed, hipFunction_t kernel, hipStream_t stream, …
H A Dceed-hip-compile.cpp204 int CeedGetKernel_Hip(Ceed ceed, hipModule_t module, const char *name, hipFunction_t *kernel) { in CeedGetKernel_Hip() argument
205 CeedCallHip(ceed, hipModuleGetFunction(kernel, module, name)); in CeedGetKernel_Hip()
212 int CeedRunKernel_Hip(Ceed ceed, hipFunction_t kernel, const int grid_size, const int block_size, v… in CeedRunKernel_Hip() argument
213 …CeedCallHip(ceed, hipModuleLaunchKernel(kernel, grid_size, 1, 1, block_size, 1, 1, 0, NULL, args, … in CeedRunKernel_Hip()
220 int CeedRunKernelDim_Hip(Ceed ceed, hipFunction_t kernel, const int grid_size, const int block_size… in CeedRunKernelDim_Hip() argument
222 …CeedCallHip(ceed, hipModuleLaunchKernel(kernel, grid_size, 1, 1, block_size_x, block_size_y, block… in CeedRunKernelDim_Hip()
229 static int CeedRunKernelDimSharedCore_Hip(Ceed ceed, hipFunction_t kernel, hipStream_t stream, cons… in CeedRunKernelDimSharedCore_Hip() argument
232 …hipError_t result = hipModuleLaunchKernel(kernel, grid_size, 1, 1, block_size_x, block_size_y, blo… in CeedRunKernelDimSharedCore_Hip()
253 int CeedRunKernelDimShared_Hip(Ceed ceed, hipFunction_t kernel, hipStream_t stream, const int grid_… in CeedRunKernelDimShared_Hip() argument
257 …CeedCallBackend(CeedRunKernelDimSharedCore_Hip(ceed, kernel, stream, grid_size, block_size_x, bloc… in CeedRunKernelDimShared_Hip()
[all …]
/libCEED/backends/xsmm/
H A Dceed-xsmm-tensor.c29 …const libxsmm_gemmfunction kernel = libxsmm_dispatch_gemm(gemm_shape, (libxsmm_bitfield)(flags), (… in CeedTensorContractApply_Xsmm() local
32 …CeedCheck(kernel, CeedTensorContractReturnCeed(contract), CEED_ERROR_BACKEND, "LIBXSMM kernel fail… in CeedTensorContractApply_Xsmm()
38 kernel(&gemm_param); in CeedTensorContractApply_Xsmm()
49 …const libxsmm_gemmfunction kernel = libxsmm_dispatch_gemm(gemm_shape, (libxsmm_bitfield)(flags), (… in CeedTensorContractApply_Xsmm() local
52 …CeedCheck(kernel, CeedTensorContractReturnCeed(contract), CEED_ERROR_BACKEND, "LIBXSMM kernel fail… in CeedTensorContractApply_Xsmm()
59 kernel(&gemm_param); in CeedTensorContractApply_Xsmm()
/libCEED/backends/sycl/
H A Dceed-sycl-compile.hpp19 …ceed, const SyclModule_t *sycl_module, const std::string &kernel_name, sycl::kernel **sycl_kernel);
21 CEED_INTERN int CeedRunKernelDimSharedSycl(Ceed ceed, sycl::kernel *kernel, const int grid_size, co…
H A Dceed-sycl-compile.sycl.cpp143 …eed, const SyclModule_t *sycl_module, const std::string &kernel_name, sycl::kernel **sycl_kernel) { in CeedGetKernel_Sycl()
160 …*sycl_kernel = new sycl::kernel(sycl::make_kernel<sycl::backend::ext_oneapi_level_zero>({*sycl_mod… in CeedGetKernel_Sycl()
169 int CeedRunKernelDimSharedSycl(Ceed ceed, sycl::kernel *kernel, const int grid_size, const int bloc… in CeedRunKernelDimSharedSycl() argument
185 cgh.parallel_for(kernel_range, *kernel); in CeedRunKernelDimSharedSycl()
/libCEED/include/ceed/jit-source/sycl/
H A Dsycl-shared-basis-tensor.h22 kernel void Interp(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global co… in Interp()
53 kernel void InterpTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, … in InterpTranspose()
90 kernel void Grad(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global cons… in Grad()
125 kernel void GradTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, gl… in GradTranspose()
163 kernel void Weight(const CeedInt num_elem, global const CeedScalar *restrict q_weight_1d, global Ce… in Weight()
/libCEED/backends/sycl-gen/
H A Dceed-sycl-gen.hpp21 sycl::kernel *op;
/libCEED/backends/sycl-ref/
H A Dceed-sycl-ref.hpp73 sycl::kernel *QFunction;
/libCEED/doc/sphinx/source/
H A DlibCEEDdev.md73kernel launches, following the libCEED operator decomposition, where first {ref}`CeedElemRestricti…
74 …y to all points across all elements in order to maximize the amount of work each kernel launch has.
83kernel to apply the action of the {ref}`CeedOperator`, significantly improving performance by elim…
84 This kernel is compiled at runtime via NVRTC, HIPRTC, or OpenCL RTC.
H A Dreleasenotes.md168 …ionGetKernelName`; refactored {c:func}`CeedQFunctionGetSourcePath` to exclude function kernel name.
186 - Added {c:func}`CeedPathConcatenate` to facilitate loading kernel source files with a path relativ…
196 - Put GPU JiTed kernel source code into separate files.
H A DlibCEEDapi.md158 … $\bm{B}$, $\bm{\mathcal{E}}$ and $\bm{P}$, starting from its point-wise kernel $\bm{D}$, a "matve…
/libCEED/examples/
H A DREADME.md47 …ctor** and include parallel scatter, element scatter, element evaluation kernel, element gather, a…
/libCEED/examples/fluids/
H A Dindex.md437 …filter width scaling tensor (also a rank 2 SPD tensor), and $\beta$ is a kernel scaling factor on …
452 …s common to denote a filter width dimensioned relative to the radial distance of the filter kernel.
512 #### Filter kernel scaling, β
513 … a certain physical filter width, the actual width of the implied filter kernel is quite larger th…
515 To match the "size" of a normal kernel to our differential kernel, we attempt to have them match se…
H A DREADME.md653 - Scaling to make differential kernel size equivalent to other filter kernels