| /libCEED/backends/hip-shared/ |
| H A D | ceed-hip-shared-basis.c | 222 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight_1d, &d_v}; in CeedBasisApplyTensorCore_Hip_shared() local 229 …ackend(CeedRunKernelDim_Hip(ceed, data->Weight, grid_size, Q_1d, elems_per_block, 1, weight_args)); in CeedBasisApplyTensorCore_Hip_shared() 235 …end(CeedRunKernelDim_Hip(ceed, data->Weight, grid_size, Q_1d, Q_1d, elems_per_block, weight_args)); in CeedBasisApplyTensorCore_Hip_shared() 241 …end(CeedRunKernelDim_Hip(ceed, data->Weight, grid_size, Q_1d, Q_1d, elems_per_block, weight_args)); in CeedBasisApplyTensorCore_Hip_shared() 590 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight_1d, &d_v}; in CeedBasisApplyNonTensorCore_Hip_shared() local 597 …kend(CeedRunKernelDim_Hip(ceed, data->Weight, grid_size, thread, elems_per_block, 1, weight_args)); in CeedBasisApplyNonTensorCore_Hip_shared()
|
| /libCEED/backends/cuda-shared/ |
| H A D | ceed-cuda-shared-basis.c | 158 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight_1d, &d_v}; in CeedBasisApplyTensorCore_Cuda_shared() local 163 …ckend(CeedRunKernelDim_Cuda(ceed, data->Weight, grid_size, Q_1d, elems_per_block, 1, weight_args)); in CeedBasisApplyTensorCore_Cuda_shared() 169 …nd(CeedRunKernelDim_Cuda(ceed, data->Weight, grid_size, Q_1d, Q_1d, elems_per_block, weight_args)); in CeedBasisApplyTensorCore_Cuda_shared() 175 …nd(CeedRunKernelDim_Cuda(ceed, data->Weight, grid_size, Q_1d, Q_1d, elems_per_block, weight_args)); in CeedBasisApplyTensorCore_Cuda_shared() 529 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight_1d, &d_v}; in CeedBasisApplyNonTensorCore_Cuda_shared() local 536 …lBackend(CeedRunKernelDim_Cuda(ceed, data->Weight, grid, thread, elems_per_block, 1, weight_args)); in CeedBasisApplyNonTensorCore_Cuda_shared()
|
| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-basis.c | 64 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight_1d, &d_v}; in CeedBasisApplyCore_Hip() local 68 …nd(CeedRunKernelDim_Hip(ceed, data->Weight, num_elem, block_size_x, block_size_y, 1, weight_args)); in CeedBasisApplyCore_Hip() 325 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight, &d_v}; in CeedBasisApplyNonTensorCore_Hip() local 327 …Backend(CeedRunKernelDim_Hip(ceed, data->Weight, grid, num_qpts, 1, elems_per_block, weight_args)); in CeedBasisApplyNonTensorCore_Hip()
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-basis.c | 64 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight_1d, &d_v}; in CeedBasisApplyCore_Cuda() local 68 …d(CeedRunKernelDim_Cuda(ceed, data->Weight, num_elem, block_size_x, block_size_y, 1, weight_args)); in CeedBasisApplyCore_Cuda() 326 void *weight_args[] = {(void *)&num_elem, (void *)&data->d_q_weight, &d_v}; in CeedBasisApplyNonTensorCore_Cuda() local 328 …ackend(CeedRunKernelDim_Cuda(ceed, data->Weight, grid, num_qpts, 1, elems_per_block, weight_args)); in CeedBasisApplyNonTensorCore_Cuda()
|