| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-ref-basis-nontensor.h | 21 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const… in Interp() 29 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d… in InterpTranspose() 40 extern "C" __global__ void Deriv(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const … in Deriv() 48 extern "C" __global__ void DerivTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d_… in DerivTranspose() 59 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight, … in Weight()
|
| H A D | hip-ref-basis-tensor.h | 19 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedInt is_transpose, const CeedSca… in Interp() 77 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedInt is_transpose, const CeedScala… in Grad() 142 __device__ void Weight1d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight1d() 155 __device__ void Weight2d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight2d() 173 __device__ void Weight3d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight3d() 193 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight_1… in Weight()
|
| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-ref-basis-nontensor.h | 21 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const… in Interp() 29 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d… in InterpTranspose() 40 extern "C" __global__ void Deriv(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const … in Deriv() 48 extern "C" __global__ void DerivTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d_… in DerivTranspose() 59 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight, … in Weight()
|
| H A D | cuda-shared-basis-tensor.h | 18 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *… in Interp() 56 extern "C" __global__ void InterpCollocated(const CeedInt num_elem, const CeedScalar *c_B, const Ce… in InterpCollocated() 86 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpTranspose() 125 extern "C" __global__ void InterpCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B,… in InterpCollocatedTranspose() 155 extern "C" __global__ void InterpTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const … in InterpTransposeAdd() 194 extern "C" __global__ void InterpCollocatedTransposeAdd(const CeedInt num_elem, const CeedScalar *c… in InterpCollocatedTransposeAdd() 227 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_… in Grad() 270 extern "C" __global__ void GradCollocated(const CeedInt num_elem, const CeedScalar *c_B, const Ceed… in GradCollocated() 310 extern "C" __global__ void GradTranspose(const CeedInt num_elem, const CeedScalar *c_B, const CeedS… in GradTranspose() 353 extern "C" __global__ void GradCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B, c… in GradCollocatedTranspose() [all …]
|
| H A D | cuda-shared-basis-nontensor.h | 18 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *… in Interp() 44 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpTranspose() 71 extern "C" __global__ void InterpTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const … in InterpTransposeAdd() 101 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedScalar *c_G, const CeedScalar *__… in Grad() 127 extern "C" __global__ void GradTranspose(const CeedInt num_elem, const CeedScalar *c_G, const CeedS… in GradTranspose() 154 extern "C" __global__ void GradTransposeAdd(const CeedInt num_elem, const CeedScalar *c_G, const Ce… in GradTransposeAdd() 184 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight, … in Weight()
|
| H A D | cuda-shared-basis-tensor-at-points.h | 23 extern "C" __global__ void InterpAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_… in InterpAtPoints() 78 extern "C" __global__ void InterpTransposeAtPoints(const CeedInt num_elem, const CeedScalar *__rest… in InterpTransposeAtPoints() 148 extern "C" __global__ void InterpTransposeAddAtPoints(const CeedInt num_elem, const CeedScalar *__r… in InterpTransposeAddAtPoints() 210 extern "C" __global__ void GradAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B,… in GradAtPoints() 265 extern "C" __global__ void GradTransposeAtPoints(const CeedInt num_elem, const CeedScalar *__restri… in GradTransposeAtPoints() 336 extern "C" __global__ void GradTransposeAddAtPoints(const CeedInt num_elem, const CeedScalar *__res… in GradTransposeAddAtPoints()
|
| H A D | cuda-ref-basis-tensor.h | 19 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedInt is_transpose, const CeedSca… in Interp() 77 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedInt is_transpose, const CeedScala… in Grad() 142 __device__ void Weight1d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight1d() 155 __device__ void Weight2d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight2d() 173 __device__ void Weight3d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight3d() 193 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight_1… in Weight()
|
| /libCEED/include/ceed/jit-source/sycl/ |
| H A D | sycl-shared-basis-tensor.h | 22 kernel void Interp(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global co… in Interp() 53 kernel void InterpTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, … in InterpTranspose() 90 kernel void Grad(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global cons… in Grad() 125 kernel void GradTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, gl… in GradTranspose() 163 kernel void Weight(const CeedInt num_elem, global const CeedScalar *restrict q_weight_1d, global Ce… in Weight()
|
| H A D | sycl-gen-templates.h | 33 …t1d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in readDofsOffset1d() 51 … const CeedInt strides_elem, const CeedInt num_elem, global const CeedScalar *restrict d_u, in readDofsStrided1d() 68 …t1d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in writeDofsOffset1d() 85 … const CeedInt strides_elem, const CeedInt num_elem, private const CeedScalar *restrict r_v, in writeDofsStrided1d() 106 …t2d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in readDofsOffset2d() 123 … const CeedInt strides_elem, const CeedInt num_elem, const global CeedScalar *restrict d_u, in readDofsStrided2d() 139 …t2d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in writeDofsOffset2d() 157 … const CeedInt strides_elem, const CeedInt num_elem, const private CeedScalar *restrict r_v, in writeDofsStrided2d() 177 …t3d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in readDofsOffset3d() 196 … const CeedInt strides_elem, const CeedInt num_elem, const global CeedScalar *restrict d_u, in readDofsStrided3d() [all …]
|
| H A D | sycl-shared-basis-read-write-templates.h | 28 inline void ReadElementStrided1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem… in ReadElementStrided1d() 46 …riteElementStrided1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem, const Cee… in WriteElementStrided1d() 68 inline void ReadElementStrided2d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem… in ReadElementStrided2d() 87 …riteElementStrided2d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem, const Cee… in WriteElementStrided2d() 110 inline void ReadElementStrided3d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem… in ReadElementStrided3d() 131 …riteElementStrided3d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem, const Cee… in WriteElementStrided3d()
|
| /libCEED/interface/ |
| H A D | ceed-elemrestriction.c | 38 …(const CeedInt *offsets, CeedInt *block_offsets, CeedInt num_block, CeedInt num_elem, CeedInt bloc… in CeedPermutePadOffsets() 64 …rients(const bool *orients, bool *block_orients, CeedInt num_block, CeedInt num_elem, CeedInt bloc… in CeedPermutePadOrients() 89 …nt8 *curl_orients, CeedInt8 *block_curl_orients, CeedInt num_block, CeedInt num_elem, CeedInt bloc… in CeedPermutePadCurlOrients() 657 int CeedElemRestrictionCreate(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt num_comp, Cee… in CeedElemRestrictionCreate() 712 int CeedElemRestrictionCreateOriented(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt num_c… in CeedElemRestrictionCreateOriented() 770 int CeedElemRestrictionCreateCurlOriented(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt n… in CeedElemRestrictionCreateCurlOriented() 824 int CeedElemRestrictionCreateStrided(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt num_co… in CeedElemRestrictionCreateStrided() 891 int CeedElemRestrictionCreateAtPoints(Ceed ceed, CeedInt num_elem, CeedInt num_points, CeedInt num_… in CeedElemRestrictionCreateAtPoints() 950 int CeedElemRestrictionCreateBlocked(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt block_… in CeedElemRestrictionCreateBlocked() 1018 int CeedElemRestrictionCreateBlockedOriented(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedIn… in CeedElemRestrictionCreateBlockedOriented() [all …]
|
| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-basis.c | 21 static int CeedBasisApplyCore_Hip(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTran… in CeedBasisApplyCore_Hip() 87 static int CeedBasisApply_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode, Ce… in CeedBasisApply_Hip() 92 static int CeedBasisApplyAdd_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode,… in CeedBasisApplyAdd_Hip() 101 static int CeedBasisApplyAtPointsCore_Hip(CeedBasis basis, bool apply_add, const CeedInt num_elem, … in CeedBasisApplyAtPointsCore_Hip() 239 static int CeedBasisApplyAtPoints_Hip(CeedBasis basis, const CeedInt num_elem, const CeedInt *num_p… in CeedBasisApplyAtPoints_Hip() 245 static int CeedBasisApplyAddAtPoints_Hip(CeedBasis basis, const CeedInt num_elem, const CeedInt *nu… in CeedBasisApplyAddAtPoints_Hip() 254 static int CeedBasisApplyNonTensorCore_Hip(CeedBasis basis, bool apply_add, const CeedInt num_elem,… in CeedBasisApplyNonTensorCore_Hip() 341 static int CeedBasisApplyNonTensor_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t… in CeedBasisApplyNonTensor_Hip() 347 static int CeedBasisApplyAddNonTensor_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMod… in CeedBasisApplyAddNonTensor_Hip()
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-basis.c | 22 static int CeedBasisApplyCore_Cuda(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTra… in CeedBasisApplyCore_Cuda() 87 static int CeedBasisApply_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode, C… in CeedBasisApply_Cuda() 93 static int CeedBasisApplyAdd_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode… in CeedBasisApplyAdd_Cuda() 102 static int CeedBasisApplyAtPointsCore_Cuda(CeedBasis basis, bool apply_add, const CeedInt num_elem,… in CeedBasisApplyAtPointsCore_Cuda() 240 static int CeedBasisApplyAtPoints_Cuda(CeedBasis basis, const CeedInt num_elem, const CeedInt *num_… in CeedBasisApplyAtPoints_Cuda() 246 static int CeedBasisApplyAddAtPoints_Cuda(CeedBasis basis, const CeedInt num_elem, const CeedInt *n… in CeedBasisApplyAddAtPoints_Cuda() 255 static int CeedBasisApplyNonTensorCore_Cuda(CeedBasis basis, bool apply_add, const CeedInt num_elem… in CeedBasisApplyNonTensorCore_Cuda() 342 static int CeedBasisApplyNonTensor_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode … in CeedBasisApplyNonTensor_Cuda() 348 static int CeedBasisApplyAddNonTensor_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMo… in CeedBasisApplyAddNonTensor_Cuda()
|
| /libCEED/backends/memcheck/ |
| H A D | ceed-memcheck-restriction.c | 20 CeedInt elem_size, num_comp, num_elem; in CeedElemRestrictionGetBackendStrides_Memcheck() local 47 … CeedInt start, CeedInt stop, CeedInt num_elem, CeedInt elem_size, in CeedElemRestrictionApplyStridedNoTranspose_Memcheck_Core() 73 … const CeedInt comp_stride, CeedInt start, CeedInt stop, CeedInt num_elem, in CeedElemRestrictionApplyOffsetNoTranspose_Memcheck_Core() 92 … CeedInt stop, CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, in CeedElemRestrictionApplyOrientedNoTranspose_Memcheck_Core() 111 … CeedInt stop, CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedNoTranspose_Memcheck_Core() 153 …CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, const CeedScalar *__restrict__ uu, CeedSca… in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Memcheck_Core() 193 … CeedInt start, CeedInt stop, CeedInt num_elem, CeedInt elem_size, in CeedElemRestrictionApplyStridedTranspose_Memcheck_Core() 219 … const CeedInt comp_stride, CeedInt start, CeedInt stop, CeedInt num_elem, in CeedElemRestrictionApplyOffsetTranspose_Memcheck_Core() 243 … const CeedInt comp_stride, CeedInt start, CeedInt stop, CeedInt num_elem, in CeedElemRestrictionApplyOrientedTranspose_Memcheck_Core() 268 … CeedInt stop, CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedTranspose_Memcheck_Core() [all …]
|
| /libCEED/tests/ |
| H A D | t211-elemrestriction.c | 9 CeedInt num_elem = 3; in main() local
|
| H A D | t212-elemrestriction.c | 9 CeedInt num_elem = 3; in main() local
|
| H A D | t214-elemrestriction.c | 8 CeedInt num_elem = 3; in main() local
|
| H A D | t210-elemrestriction.c | 8 CeedInt num_elem = 3; in main() local
|
| H A D | t215-elemrestriction.c | 8 CeedInt num_elem = 3; in main() local
|
| H A D | t209-elemrestriction.c | 10 CeedInt num_elem = 3; in main() local
|
| H A D | t216-elemrestriction.c | 9 CeedInt num_elem = 3, comp_stride = 1; in main() local
|
| H A D | t230-elemrestriction.c | 8 CeedInt num_elem = 3, num_points = num_elem * 2; in main() local
|
| /libCEED/backends/cuda-shared/ |
| H A D | ceed-cuda-shared-basis.c | 24 …asisApplyTensorCore_Cuda_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyTensorCore_Cuda_shared() 195 static int CeedBasisApplyTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeM… in CeedBasisApplyTensor_Cuda_shared() 201 static int CeedBasisApplyAddTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTranspo… in CeedBasisApplyAddTensor_Cuda_shared() 210 …isApplyAtPointsCore_Cuda_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, const Cee… in CeedBasisApplyAtPointsCore_Cuda_shared() 433 static int CeedBasisApplyAtPoints_Cuda_shared(CeedBasis basis, const CeedInt num_elem, const CeedIn… in CeedBasisApplyAtPoints_Cuda_shared() 439 static int CeedBasisApplyAddAtPoints_Cuda_shared(CeedBasis basis, const CeedInt num_elem, const Cee… in CeedBasisApplyAddAtPoints_Cuda_shared() 448 …sApplyNonTensorCore_Cuda_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyNonTensorCore_Cuda_shared() 556 static int CeedBasisApplyNonTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTranspo… in CeedBasisApplyNonTensor_Cuda_shared() 562 static int CeedBasisApplyAddNonTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTran… in CeedBasisApplyAddNonTensor_Cuda_shared()
|
| /libCEED/backends/sycl-ref/ |
| H A D | ceed-sycl-restriction.sycl.cpp | 30 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionStridedNoTranspose_Sycl() local 57 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionOffsetNoTranspose_Sycl() local 85 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionStridedTranspose_Sycl() local 114 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionOffsetTranspose_Sycl() local 254 …CeedInt num_elem, elem_size, num_comp, num_nodes = 0, *ind_to_offset, *l_vec_ind… in CeedElemRestrictionOffset_Sycl() local 343 CeedInt num_elem, num_comp, elem_size, comp_stride = 1; in CeedElemRestrictionCreate_Sycl() local
|
| /libCEED/backends/hip-shared/ |
| H A D | ceed-hip-shared-basis.c | 91 …BasisApplyTensorCore_Hip_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyTensorCore_Hip_shared() 261 int CeedBasisApplyTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mo… in CeedBasisApplyTensor_Hip_shared() 267 int CeedBasisApplyAddTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t… in CeedBasisApplyAddTensor_Hip_shared() 276 …sisApplyAtPointsCore_Hip_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, const Cee… in CeedBasisApplyAtPointsCore_Hip_shared() 496 static int CeedBasisApplyAtPoints_Hip_shared(CeedBasis basis, const CeedInt num_elem, const CeedInt… in CeedBasisApplyAtPoints_Hip_shared() 502 static int CeedBasisApplyAddAtPoints_Hip_shared(CeedBasis basis, const CeedInt num_elem, const Ceed… in CeedBasisApplyAddAtPoints_Hip_shared() 511 …isApplyNonTensorCore_Hip_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyNonTensorCore_Hip_shared() 617 int CeedBasisApplyNonTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t… in CeedBasisApplyNonTensor_Hip_shared() 623 int CeedBasisApplyAddNonTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMod… in CeedBasisApplyAddNonTensor_Hip_shared()
|