| /libCEED/include/ceed/jit-source/sycl/ |
| H A D | sycl-shared-basis-tensor.h | 22 kernel void Interp(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global co… in Interp() argument 33 loadMatrix(BASIS_P_1D * BASIS_Q_1D, d_interp_1d, s_B); in Interp() 53 kernel void InterpTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, … in InterpTranspose() argument 67 loadMatrix(BASIS_P_1D * BASIS_Q_1D, d_interp_1d, s_B); in InterpTranspose() 90 kernel void Grad(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global cons… in Grad() argument 103 loadMatrix(BASIS_P_1D * BASIS_Q_1D, d_interp_1d, s_B); in Grad() 125 kernel void GradTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, gl… in GradTranspose() argument 138 loadMatrix(BASIS_P_1D * BASIS_Q_1D, d_interp_1d, s_B); in GradTranspose()
|
| /libCEED/backends/sycl-shared/ |
| H A D | ceed-sycl-shared-basis.sycl.cpp | 71 cgh.set_args(num_elem, impl->d_interp_1d, d_u, d_v); in CeedBasisApplyTensor_Sycl_shared() 94 cgh.set_args(num_elem, impl->d_interp_1d, d_grad_1d, d_u, d_v); in CeedBasisApplyTensor_Sycl_shared() 148 CeedCallSycl(ceed, sycl::free(impl->d_interp_1d, data->sycl_context)); in CeedBasisDestroy_Sycl_shared() 211 …CeedCallSycl(ceed, impl->d_interp_1d = sycl::malloc_device<CeedScalar>(interp_length, data->sycl_d… in CeedBasisCreateTensorH1_Sycl_shared() 212 …sycl::event copy_interp = data->sycl_queue.copy<CeedScalar>(interp_1d, impl->d_interp_1d, interp_l… in CeedBasisCreateTensorH1_Sycl_shared()
|
| H A D | ceed-sycl-shared.hpp | 27 CeedScalar *d_interp_1d; member
|
| /libCEED/backends/hip-shared/ |
| H A D | ceed-hip-shared-basis.c | 121 …CeedCheck(data->d_interp_1d, ceed, CEED_ERROR_BACKEND, "%s not supported; interp_1d not set", Ceed… in CeedBasisApplyTensorCore_Hip_shared() 125 void *interp_args[] = {(void *)&num_elem, &data->d_interp_1d, &d_u, &d_v}; in CeedBasisApplyTensorCore_Hip_shared() 177 void *grad_args[] = {(void *)&num_elem, &data->d_interp_1d, &d_grad_1d, &d_u, &d_v}; in CeedBasisApplyTensorCore_Hip_shared() 540 …CeedCheck(data->d_interp_1d, ceed, CEED_ERROR_BACKEND, "%s not supported; interp not set", CeedEva… in CeedBasisApplyNonTensorCore_Hip_shared() 544 void *interp_args[] = {(void *)&num_elem, &data->d_interp_1d, &d_u, &d_v}; in CeedBasisApplyNonTensorCore_Hip_shared() 643 CeedCallHip(ceed, hipFree(data->d_interp_1d)); in CeedBasisDestroy_Hip_shared() 671 CeedCallHip(ceed, hipMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Hip_shared() 672 CeedCallHip(ceed, hipMemcpy(data->d_interp_1d, interp_1d, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip_shared() 762 CeedCallHip(ceed, hipMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateH1_Hip_shared() 763 CeedCallHip(ceed, hipMemcpy(data->d_interp_1d, interp, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateH1_Hip_shared()
|
| H A D | ceed-hip-shared.h | 31 CeedScalar *d_interp_1d; member
|
| /libCEED/backends/cuda-shared/ |
| H A D | ceed-cuda-shared-basis.c | 53 …CeedCheck(data->d_interp_1d, ceed, CEED_ERROR_BACKEND, "%s not supported; interp_1d not set", Ceed… in CeedBasisApplyTensorCore_Cuda_shared() 58 void *interp_args[] = {(void *)&num_elem, &data->d_interp_1d, &d_u, &d_v}; in CeedBasisApplyTensorCore_Cuda_shared() 112 void *grad_args[] = {(void *)&num_elem, &data->d_interp_1d, &d_grad_1d, &d_u, &d_v}; in CeedBasisApplyTensorCore_Cuda_shared() 476 …CeedCheck(data->d_interp_1d, ceed, CEED_ERROR_BACKEND, "%s not supported; interp not set", CeedEva… in CeedBasisApplyNonTensorCore_Cuda_shared() 481 void *interp_args[] = {(void *)&num_elem, &data->d_interp_1d, &d_u, &d_v}; in CeedBasisApplyNonTensorCore_Cuda_shared() 582 CeedCallCuda(ceed, cudaFree(data->d_interp_1d)); in CeedBasisDestroy_Cuda_shared() 610 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Cuda_shared() 611 …CeedCallCuda(ceed, cudaMemcpy(data->d_interp_1d, interp_1d, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda_shared() 696 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateH1_Cuda_shared() 697 CeedCallCuda(ceed, cudaMemcpy(data->d_interp_1d, interp, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateH1_Cuda_shared()
|
| H A D | ceed-cuda-shared.h | 30 CeedScalar *d_interp_1d; member
|
| /libCEED/backends/magma/ |
| H A D | ceed-magma.h | 55 CeedScalar *d_interp_1d; member
|
| H A D | ceed-magma-basis.c | 117 …void *args[] = {&impl->d_interp_1d, &d_u, &u_elem_stride, &u_comp_stride, &d_v, &v_elem_stride, … in CeedBasisApplyCore_Magma() 194 …void *args[] = {&impl->d_interp_1d, &impl->d_grad_1d, &d_u, &u_elem_stride, &u_comp_str… in CeedBasisApplyCore_Magma() 492 CeedCallBackend(magma_free(impl->d_interp_1d)); in CeedBasisDestroy_Magma() 551 CeedCallBackend(magma_malloc((void **)&impl->d_interp_1d, Q_1d * P_1d * sizeof(interp_1d[0]))); in CeedBasisCreateTensorH1_Magma() 552 …magma_setvector(Q_1d * P_1d, sizeof(interp_1d[0]), interp_1d, 1, impl->d_interp_1d, 1, data->queue… in CeedBasisCreateTensorH1_Magma()
|
| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-basis.c | 51 …void *interp_args[] = {(void *)&num_elem, (void *)&is_transpose, &data->d_interp_1d, &d_u,… in CeedBasisApplyCore_Hip() 57 …void *grad_args[] = {(void *)&num_elem, (void *)&is_transpose, &data->d_interp_1d, &data->… in CeedBasisApplyCore_Hip() 367 CeedCallHip(ceed, hipFree(data->d_interp_1d)); in CeedBasisDestroy_Hip() 414 CeedCallHip(ceed, hipMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Hip() 415 CeedCallHip(ceed, hipMemcpy(data->d_interp_1d, interp_1d, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip()
|
| H A D | ceed-hip-ref.h | 81 CeedScalar *d_interp_1d; member
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-basis.c | 51 …void *interp_args[] = {(void *)&num_elem, (void *)&is_transpose, &data->d_interp_1d, &d_u,… in CeedBasisApplyCore_Cuda() 57 …void *grad_args[] = {(void *)&num_elem, (void *)&is_transpose, &data->d_interp_1d, &data->… in CeedBasisApplyCore_Cuda() 368 CeedCallCuda(ceed, cudaFree(data->d_interp_1d)); in CeedBasisDestroy_Cuda() 415 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Cuda() 416 …CeedCallCuda(ceed, cudaMemcpy(data->d_interp_1d, interp_1d, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda()
|
| H A D | ceed-cuda-ref.h | 76 CeedScalar *d_interp_1d; member
|
| /libCEED/backends/sycl-ref/ |
| H A D | ceed-sycl-ref.hpp | 56 CeedScalar *d_interp_1d; member
|
| H A D | ceed-sycl-ref-basis.sycl.cpp | 43 const CeedScalar *interp_1d = impl->d_interp_1d; in CeedBasisApplyInterp_Sycl() 146 const CeedScalar *interp_1d = impl->d_interp_1d; in CeedBasisApplyGrad_Sycl() 527 CeedCallSycl(ceed, sycl::free(impl->d_interp_1d, data->sycl_context)); in CeedBasisDestroy_Sycl() 598 …CeedCallSycl(ceed, impl->d_interp_1d = sycl::malloc_device<CeedScalar>(interp_length, data->sycl_d… in CeedBasisCreateTensorH1_Sycl() 599 …sycl::event copy_interp = data->sycl_queue.copy<CeedScalar>(interp_1d, impl->d_interp_1d, interp_l… in CeedBasisCreateTensorH1_Sycl()
|
| /libCEED/backends/sycl-gen/ |
| H A D | ceed-sycl-gen-operator-build.sycl.cpp | 300 h_B.inputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen() 306 h_B.inputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen() 358 h_B.outputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen() 364 h_B.outputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen()
|
| /libCEED/backends/hip-gen/ |
| H A D | ceed-hip-gen-operator-build.cpp | 291 if (is_input) data->B.inputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Hip_gen() 292 else data->B.outputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Hip_gen() 329 if (is_input) data->B.inputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Hip_gen() 330 else data->B.outputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Hip_gen()
|
| /libCEED/backends/cuda-gen/ |
| H A D | ceed-cuda-gen-operator-build.cpp | 264 if (is_input) data->B.inputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Cuda_gen() 265 else data->B.outputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Cuda_gen() 302 if (is_input) data->B.inputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Cuda_gen() 303 else data->B.outputs[i] = basis_data->d_interp_1d; in CeedOperatorBuildKernelFieldData_Cuda_gen()
|