Home
last modified time | relevance | path

Searched defs:num_elem (Results 1 – 25 of 148) sorted by relevance

123456

/libCEED/include/ceed/jit-source/hip/
H A Dhip-ref-basis-nontensor.h21 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const… in Interp()
29 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d… in InterpTranspose()
40 extern "C" __global__ void Deriv(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const … in Deriv()
48 extern "C" __global__ void DerivTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d_… in DerivTranspose()
59 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight, … in Weight()
H A Dhip-ref-basis-tensor.h19 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedInt is_transpose, const CeedSca… in Interp()
77 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedInt is_transpose, const CeedScala… in Grad()
142 __device__ void Weight1d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight1d()
155 __device__ void Weight2d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight2d()
173 __device__ void Weight3d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight3d()
193 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight_1… in Weight()
/libCEED/include/ceed/jit-source/cuda/
H A Dcuda-ref-basis-nontensor.h21 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const… in Interp()
29 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d… in InterpTranspose()
40 extern "C" __global__ void Deriv(const CeedInt num_elem, const CeedScalar *__restrict__ d_B, const … in Deriv()
48 extern "C" __global__ void DerivTranspose(const CeedInt num_elem, const CeedScalar *__restrict__ d_… in DerivTranspose()
59 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight, … in Weight()
H A Dcuda-shared-basis-tensor.h18 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *… in Interp()
56 extern "C" __global__ void InterpCollocated(const CeedInt num_elem, const CeedScalar *c_B, const Ce… in InterpCollocated()
86 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpTranspose()
125 extern "C" __global__ void InterpCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B,… in InterpCollocatedTranspose()
155 extern "C" __global__ void InterpTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const … in InterpTransposeAdd()
194 extern "C" __global__ void InterpCollocatedTransposeAdd(const CeedInt num_elem, const CeedScalar *c… in InterpCollocatedTransposeAdd()
227 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_… in Grad()
270 extern "C" __global__ void GradCollocated(const CeedInt num_elem, const CeedScalar *c_B, const Ceed… in GradCollocated()
310 extern "C" __global__ void GradTranspose(const CeedInt num_elem, const CeedScalar *c_B, const CeedS… in GradTranspose()
353 extern "C" __global__ void GradCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B, c… in GradCollocatedTranspose()
[all …]
H A Dcuda-shared-basis-nontensor.h18 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *… in Interp()
44 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpTranspose()
71 extern "C" __global__ void InterpTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const … in InterpTransposeAdd()
101 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedScalar *c_G, const CeedScalar *__… in Grad()
127 extern "C" __global__ void GradTranspose(const CeedInt num_elem, const CeedScalar *c_G, const CeedS… in GradTranspose()
154 extern "C" __global__ void GradTransposeAdd(const CeedInt num_elem, const CeedScalar *c_G, const Ce… in GradTransposeAdd()
184 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight, … in Weight()
H A Dcuda-shared-basis-tensor-at-points.h23 extern "C" __global__ void InterpAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_… in InterpAtPoints()
78 extern "C" __global__ void InterpTransposeAtPoints(const CeedInt num_elem, const CeedScalar *__rest… in InterpTransposeAtPoints()
148 extern "C" __global__ void InterpTransposeAddAtPoints(const CeedInt num_elem, const CeedScalar *__r… in InterpTransposeAddAtPoints()
210 extern "C" __global__ void GradAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B,… in GradAtPoints()
265 extern "C" __global__ void GradTransposeAtPoints(const CeedInt num_elem, const CeedScalar *__restri… in GradTransposeAtPoints()
336 extern "C" __global__ void GradTransposeAddAtPoints(const CeedInt num_elem, const CeedScalar *__res… in GradTransposeAddAtPoints()
H A Dcuda-ref-basis-tensor.h19 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedInt is_transpose, const CeedSca… in Interp()
77 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedInt is_transpose, const CeedScala… in Grad()
142 __device__ void Weight1d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight1d()
155 __device__ void Weight2d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight2d()
173 __device__ void Weight3d(const CeedInt num_elem, const CeedScalar *q_weight_1d, CeedScalar *w) { in Weight3d()
193 extern "C" __global__ void Weight(const CeedInt num_elem, const CeedScalar *__restrict__ q_weight_1… in Weight()
/libCEED/include/ceed/jit-source/sycl/
H A Dsycl-shared-basis-tensor.h22 kernel void Interp(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global co… in Interp()
53 kernel void InterpTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, … in InterpTranspose()
90 kernel void Grad(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, global cons… in Grad()
125 kernel void GradTranspose(const CeedInt num_elem, global const CeedScalar *restrict d_interp_1d, gl… in GradTranspose()
163 kernel void Weight(const CeedInt num_elem, global const CeedScalar *restrict q_weight_1d, global Ce… in Weight()
H A Dsycl-gen-templates.h33 …t1d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in readDofsOffset1d()
51 … const CeedInt strides_elem, const CeedInt num_elem, global const CeedScalar *restrict d_u, in readDofsStrided1d()
68 …t1d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in writeDofsOffset1d()
85 … const CeedInt strides_elem, const CeedInt num_elem, private const CeedScalar *restrict r_v, in writeDofsStrided1d()
106 …t2d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in readDofsOffset2d()
123 … const CeedInt strides_elem, const CeedInt num_elem, const global CeedScalar *restrict d_u, in readDofsStrided2d()
139 …t2d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in writeDofsOffset2d()
157 … const CeedInt strides_elem, const CeedInt num_elem, const private CeedScalar *restrict r_v, in writeDofsStrided2d()
177 …t3d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_elem, in readDofsOffset3d()
196 … const CeedInt strides_elem, const CeedInt num_elem, const global CeedScalar *restrict d_u, in readDofsStrided3d()
[all …]
H A Dsycl-shared-basis-read-write-templates.h28 inline void ReadElementStrided1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem in ReadElementStrided1d()
46 …riteElementStrided1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem, const Cee… in WriteElementStrided1d()
68 inline void ReadElementStrided2d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem in ReadElementStrided2d()
87 …riteElementStrided2d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem, const Cee… in WriteElementStrided2d()
110 inline void ReadElementStrided3d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem in ReadElementStrided3d()
131 …riteElementStrided3d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem, const Cee… in WriteElementStrided3d()
/libCEED/interface/
H A Dceed-elemrestriction.c38 …(const CeedInt *offsets, CeedInt *block_offsets, CeedInt num_block, CeedInt num_elem, CeedInt bloc… in CeedPermutePadOffsets()
64 …rients(const bool *orients, bool *block_orients, CeedInt num_block, CeedInt num_elem, CeedInt bloc… in CeedPermutePadOrients()
89 …nt8 *curl_orients, CeedInt8 *block_curl_orients, CeedInt num_block, CeedInt num_elem, CeedInt bloc… in CeedPermutePadCurlOrients()
657 int CeedElemRestrictionCreate(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt num_comp, Cee… in CeedElemRestrictionCreate()
712 int CeedElemRestrictionCreateOriented(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt num_c… in CeedElemRestrictionCreateOriented()
770 int CeedElemRestrictionCreateCurlOriented(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt n… in CeedElemRestrictionCreateCurlOriented()
824 int CeedElemRestrictionCreateStrided(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt num_co… in CeedElemRestrictionCreateStrided()
891 int CeedElemRestrictionCreateAtPoints(Ceed ceed, CeedInt num_elem, CeedInt num_points, CeedInt num_… in CeedElemRestrictionCreateAtPoints()
950 int CeedElemRestrictionCreateBlocked(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedInt block_… in CeedElemRestrictionCreateBlocked()
1018 int CeedElemRestrictionCreateBlockedOriented(Ceed ceed, CeedInt num_elem, CeedInt elem_size, CeedIn… in CeedElemRestrictionCreateBlockedOriented()
[all …]
/libCEED/backends/hip-ref/
H A Dceed-hip-ref-basis.c21 static int CeedBasisApplyCore_Hip(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTran… in CeedBasisApplyCore_Hip()
87 static int CeedBasisApply_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode, Ce… in CeedBasisApply_Hip()
92 static int CeedBasisApplyAdd_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode,… in CeedBasisApplyAdd_Hip()
101 static int CeedBasisApplyAtPointsCore_Hip(CeedBasis basis, bool apply_add, const CeedInt num_elem, … in CeedBasisApplyAtPointsCore_Hip()
239 static int CeedBasisApplyAtPoints_Hip(CeedBasis basis, const CeedInt num_elem, const CeedInt *num_p… in CeedBasisApplyAtPoints_Hip()
245 static int CeedBasisApplyAddAtPoints_Hip(CeedBasis basis, const CeedInt num_elem, const CeedInt *nu… in CeedBasisApplyAddAtPoints_Hip()
254 static int CeedBasisApplyNonTensorCore_Hip(CeedBasis basis, bool apply_add, const CeedInt num_elem,… in CeedBasisApplyNonTensorCore_Hip()
341 static int CeedBasisApplyNonTensor_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t… in CeedBasisApplyNonTensor_Hip()
347 static int CeedBasisApplyAddNonTensor_Hip(CeedBasis basis, const CeedInt num_elem, CeedTransposeMod… in CeedBasisApplyAddNonTensor_Hip()
/libCEED/backends/cuda-ref/
H A Dceed-cuda-ref-basis.c22 static int CeedBasisApplyCore_Cuda(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTra… in CeedBasisApplyCore_Cuda()
87 static int CeedBasisApply_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode, C… in CeedBasisApply_Cuda()
93 static int CeedBasisApplyAdd_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mode… in CeedBasisApplyAdd_Cuda()
102 static int CeedBasisApplyAtPointsCore_Cuda(CeedBasis basis, bool apply_add, const CeedInt num_elem,… in CeedBasisApplyAtPointsCore_Cuda()
240 static int CeedBasisApplyAtPoints_Cuda(CeedBasis basis, const CeedInt num_elem, const CeedInt *num_… in CeedBasisApplyAtPoints_Cuda()
246 static int CeedBasisApplyAddAtPoints_Cuda(CeedBasis basis, const CeedInt num_elem, const CeedInt *n… in CeedBasisApplyAddAtPoints_Cuda()
255 static int CeedBasisApplyNonTensorCore_Cuda(CeedBasis basis, bool apply_add, const CeedInt num_elem in CeedBasisApplyNonTensorCore_Cuda()
342 static int CeedBasisApplyNonTensor_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode … in CeedBasisApplyNonTensor_Cuda()
348 static int CeedBasisApplyAddNonTensor_Cuda(CeedBasis basis, const CeedInt num_elem, CeedTransposeMo… in CeedBasisApplyAddNonTensor_Cuda()
/libCEED/backends/memcheck/
H A Dceed-memcheck-restriction.c20 CeedInt elem_size, num_comp, num_elem; in CeedElemRestrictionGetBackendStrides_Memcheck() local
47 … CeedInt start, CeedInt stop, CeedInt num_elem, CeedInt elem_size, in CeedElemRestrictionApplyStridedNoTranspose_Memcheck_Core()
73 … const CeedInt comp_stride, CeedInt start, CeedInt stop, CeedInt num_elem, in CeedElemRestrictionApplyOffsetNoTranspose_Memcheck_Core()
92 … CeedInt stop, CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, in CeedElemRestrictionApplyOrientedNoTranspose_Memcheck_Core()
111 … CeedInt stop, CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedNoTranspose_Memcheck_Core()
153CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, const CeedScalar *__restrict__ uu, CeedSca… in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Memcheck_Core()
193 … CeedInt start, CeedInt stop, CeedInt num_elem, CeedInt elem_size, in CeedElemRestrictionApplyStridedTranspose_Memcheck_Core()
219 … const CeedInt comp_stride, CeedInt start, CeedInt stop, CeedInt num_elem, in CeedElemRestrictionApplyOffsetTranspose_Memcheck_Core()
243 … const CeedInt comp_stride, CeedInt start, CeedInt stop, CeedInt num_elem, in CeedElemRestrictionApplyOrientedTranspose_Memcheck_Core()
268 … CeedInt stop, CeedInt num_elem, CeedInt elem_size, CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedTranspose_Memcheck_Core()
[all …]
/libCEED/tests/
H A Dt211-elemrestriction.c9 CeedInt num_elem = 3; in main() local
H A Dt212-elemrestriction.c9 CeedInt num_elem = 3; in main() local
H A Dt214-elemrestriction.c8 CeedInt num_elem = 3; in main() local
H A Dt210-elemrestriction.c8 CeedInt num_elem = 3; in main() local
H A Dt215-elemrestriction.c8 CeedInt num_elem = 3; in main() local
H A Dt209-elemrestriction.c10 CeedInt num_elem = 3; in main() local
H A Dt216-elemrestriction.c9 CeedInt num_elem = 3, comp_stride = 1; in main() local
H A Dt230-elemrestriction.c8 CeedInt num_elem = 3, num_points = num_elem * 2; in main() local
/libCEED/backends/cuda-shared/
H A Dceed-cuda-shared-basis.c24 …asisApplyTensorCore_Cuda_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyTensorCore_Cuda_shared()
195 static int CeedBasisApplyTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeM… in CeedBasisApplyTensor_Cuda_shared()
201 static int CeedBasisApplyAddTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTranspo… in CeedBasisApplyAddTensor_Cuda_shared()
210 …isApplyAtPointsCore_Cuda_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, const Cee… in CeedBasisApplyAtPointsCore_Cuda_shared()
433 static int CeedBasisApplyAtPoints_Cuda_shared(CeedBasis basis, const CeedInt num_elem, const CeedIn… in CeedBasisApplyAtPoints_Cuda_shared()
439 static int CeedBasisApplyAddAtPoints_Cuda_shared(CeedBasis basis, const CeedInt num_elem, const Cee… in CeedBasisApplyAddAtPoints_Cuda_shared()
448 …sApplyNonTensorCore_Cuda_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyNonTensorCore_Cuda_shared()
556 static int CeedBasisApplyNonTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTranspo… in CeedBasisApplyNonTensor_Cuda_shared()
562 static int CeedBasisApplyAddNonTensor_Cuda_shared(CeedBasis basis, const CeedInt num_elem, CeedTran… in CeedBasisApplyAddNonTensor_Cuda_shared()
/libCEED/backends/sycl-ref/
H A Dceed-sycl-restriction.sycl.cpp30 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionStridedNoTranspose_Sycl() local
57 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionOffsetNoTranspose_Sycl() local
85 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionStridedTranspose_Sycl() local
114 const CeedInt num_elem = impl->num_elem; in CeedElemRestrictionOffsetTranspose_Sycl() local
254 …CeedInt num_elem, elem_size, num_comp, num_nodes = 0, *ind_to_offset, *l_vec_ind… in CeedElemRestrictionOffset_Sycl() local
343 CeedInt num_elem, num_comp, elem_size, comp_stride = 1; in CeedElemRestrictionCreate_Sycl() local
/libCEED/backends/hip-shared/
H A Dceed-hip-shared-basis.c91 …BasisApplyTensorCore_Hip_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyTensorCore_Hip_shared()
261 int CeedBasisApplyTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t_mo… in CeedBasisApplyTensor_Hip_shared()
267 int CeedBasisApplyAddTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t… in CeedBasisApplyAddTensor_Hip_shared()
276 …sisApplyAtPointsCore_Hip_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, const Cee… in CeedBasisApplyAtPointsCore_Hip_shared()
496 static int CeedBasisApplyAtPoints_Hip_shared(CeedBasis basis, const CeedInt num_elem, const CeedInt… in CeedBasisApplyAtPoints_Hip_shared()
502 static int CeedBasisApplyAddAtPoints_Hip_shared(CeedBasis basis, const CeedInt num_elem, const Ceed… in CeedBasisApplyAddAtPoints_Hip_shared()
511 …isApplyNonTensorCore_Hip_shared(CeedBasis basis, bool apply_add, const CeedInt num_elem, CeedTrans… in CeedBasisApplyNonTensorCore_Hip_shared()
617 int CeedBasisApplyNonTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMode t… in CeedBasisApplyNonTensor_Hip_shared()
623 int CeedBasisApplyAddNonTensor_Hip_shared(CeedBasis basis, const CeedInt num_elem, CeedTransposeMod… in CeedBasisApplyAddNonTensor_Hip_shared()

123456