| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-shared-basis-tensor-templates.h | 20 inline __device__ void ContractX1d(SharedData_Cuda &data, const CeedScalar *U, const CeedScalar *B,… in ContractX1d() 36 inline __device__ void ContractTransposeX1d(SharedData_Cuda &data, const CeedScalar *U, const CeedS… in ContractTransposeX1d() 52 inline __device__ void Interp1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const Ce… in Interp1d() 62 inline __device__ void InterpTranspose1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U,… in InterpTranspose1d() 73 inline __device__ void InterpCollocatedNodes1d(SharedData_Cuda &data, const CeedScalar *__restrict_… in InterpCollocatedNodes1d() 84 inline __device__ void InterpTransposeCollocatedNodes1d(SharedData_Cuda &data, const CeedScalar *__… in InterpTransposeCollocatedNodes1d() 95 inline __device__ void Grad1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const Ceed… in Grad1d() 106 inline __device__ void GradTranspose1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, c… in GradTranspose1d() 117 inline __device__ void Weight1d(SharedData_Cuda &data, const CeedScalar *__restrict__ q_weight_1d, … in Weight1d() 129 inline __device__ void ContractX2d(SharedData_Cuda &data, const CeedScalar *U, const CeedScalar *B,… in ContractX2d() [all …]
|
| H A D | cuda-shared-basis-nontensor-templates.h | 16 inline __device__ void Contract1d(SharedData_Cuda &data, const CeedScalar *U, const CeedScalar *B, … in Contract1d() 32 inline __device__ void ContractTranspose1d(SharedData_Cuda &data, const CeedScalar *U, const CeedSc… in ContractTranspose1d() 47 inline __device__ void InterpNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, c… in InterpNonTensor() 58 inline __device__ void InterpTransposeNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict… in InterpTransposeNonTensor() 70 inline __device__ void GradNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, con… in GradNonTensor() 82 inline __device__ void GradTransposeNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__… in GradTransposeNonTensor() 96 inline __device__ void WeightNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__ q_weig… in WeightNonTensor()
|
| H A D | cuda-shared-basis-tensor-flattened-templates.h | 20 inline __device__ void ContractX2dFlattened(SharedData_Cuda &data, const int t_id_x, const int t_id… in ContractX2dFlattened() 37 inline __device__ void ContractY2dFlattened(SharedData_Cuda &data, const int t_id_x, const int t_id… in ContractY2dFlattened() 54 inline __device__ void ContractTransposeY2dFlattened(SharedData_Cuda &data, const int t_id_x, const… in ContractTransposeY2dFlattened() 71 inline __device__ void ContractTransposeX2dFlattened(SharedData_Cuda &data, const int t_id_x, const… in ContractTransposeX2dFlattened() 88 inline __device__ void ContractTransposeAddX2dFlattened(SharedData_Cuda &data, const int t_id_x, co… in ContractTransposeAddX2dFlattened() 104 inline __device__ void QPack2d(SharedData_Cuda &data, const int t_id_x, const int t_id_y, CeedScala… in QPack2d() 116 inline __device__ void QUnpack2d(SharedData_Cuda &data, const int t_id_x, const int t_id_y, CeedSca… in QUnpack2d() 131 inline __device__ void InterpTensor2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U,… in InterpTensor2dFlattened() 150 inline __device__ void InterpTransposeTensor2dFlattened(SharedData_Cuda &data, CeedScalar *__restri… in InterpTransposeTensor2dFlattened() 168 inline __device__ void InterpTensorCollocatedNodes2dFlattened(SharedData_Cuda &data, CeedScalar *__… in InterpTensorCollocatedNodes2dFlattened() [all …]
|
| H A D | cuda-gen-templates.h | 16 inline __device__ void LoadMatrix(SharedData_Cuda &data, const CeedScalar *__restrict__ d_B, CeedSc… in LoadMatrix() 28 inline __device__ void ReadPoint(SharedData_Cuda &data, const CeedInt elem, const CeedInt p, const … in ReadPoint() 41 inline __device__ void WritePoint(SharedData_Cuda &data, const CeedInt elem, const CeedInt p, const… in WritePoint() 60 inline __device__ void SetEVecStandard1d_Single(SharedData_Cuda &data, const CeedInt n, const CeedS… in SetEVecStandard1d_Single() 73 inline __device__ void ReadLVecStandard1d(SharedData_Cuda &data, const CeedInt num_nodes, const Cee… in ReadLVecStandard1d() 87 inline __device__ void ReadLVecStrided1d(SharedData_Cuda &data, const CeedInt elem, const CeedScala… in ReadLVecStrided1d() 101 inline __device__ void WriteLVecStandard1d(SharedData_Cuda &data, const CeedInt num_nodes, const Ce… in WriteLVecStandard1d() 112 inline __device__ void WriteLVecStandard1d_Single(SharedData_Cuda &data, const CeedInt num_nodes, c… in WriteLVecStandard1d_Single() 129 inline __device__ void WriteLVecStandard1d_Assembly(SharedData_Cuda &data, const CeedInt num_nodes,… in WriteLVecStandard1d_Assembly() 148 inline __device__ void WriteLVecStandard1d_QFAssembly(SharedData_Cuda &data, const CeedInt num_elem… in WriteLVecStandard1d_QFAssembly() [all …]
|
| H A D | cuda-shared-basis-tensor.h | 21 SharedData_Cuda data; in Interp() local 60 SharedData_Cuda data; in InterpCollocated() local 90 SharedData_Cuda data; in InterpTranspose() local 129 SharedData_Cuda data; in InterpCollocatedTranspose() local 159 SharedData_Cuda data; in InterpTransposeAdd() local 198 SharedData_Cuda data; in InterpCollocatedTransposeAdd() local 231 SharedData_Cuda data; in Grad() local 274 SharedData_Cuda data; in GradCollocated() local 314 SharedData_Cuda data; in GradTranspose() local 357 SharedData_Cuda data; in GradCollocatedTranspose() local [all …]
|
| H A D | cuda-shared-basis-nontensor.h | 21 SharedData_Cuda data; in Interp() local 48 SharedData_Cuda data; in InterpTranspose() local 75 SharedData_Cuda data; in InterpTransposeAdd() local 104 SharedData_Cuda data; in Grad() local 131 SharedData_Cuda data; in GradTranspose() local 158 SharedData_Cuda data; in GradTransposeAdd() local 187 SharedData_Cuda data; in Weight() local
|
| H A D | cuda-shared-basis-read-write-templates.h | 16 inline __device__ void LoadMatrix(SharedData_Cuda &data, const CeedScalar *__restrict__ d_B, CeedSc… in LoadMatrix() 28 inline __device__ void ReadElementStrided1d(SharedData_Cuda &data, const CeedInt elem, const CeedIn… in ReadElementStrided1d() 44 inline __device__ void WriteElementStrided1d(SharedData_Cuda &data, const CeedInt elem, const CeedI… in WriteElementStrided1d() 57 inline __device__ void SumElementStrided1d(SharedData_Cuda &data, const CeedInt elem, const CeedInt… in SumElementStrided1d() 77 inline __device__ void ReadElementStrided2d(SharedData_Cuda &data, const CeedInt elem, const CeedIn… in ReadElementStrided2d() 93 inline __device__ void WriteElementStrided2d(SharedData_Cuda &data, const CeedInt elem, const CeedI… in WriteElementStrided2d() 106 inline __device__ void SumElementStrided2d(SharedData_Cuda &data, const CeedInt elem, const CeedInt… in SumElementStrided2d() 126 inline __device__ void ReadElementStrided3d(SharedData_Cuda &data, const CeedInt elem, const CeedIn… in ReadElementStrided3d() 144 inline __device__ void WriteElementStrided3d(SharedData_Cuda &data, const CeedInt elem, const CeedI… in WriteElementStrided3d() 159 inline __device__ void SumElementStrided3d(SharedData_Cuda &data, const CeedInt elem, const CeedInt… in SumElementStrided3d() [all …]
|
| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-shared-basis-tensor-templates.h | 20 inline __device__ void ContractX1d(SharedData_Hip &data, const CeedScalar *U, const CeedScalar *B, … in ContractX1d() 36 inline __device__ void ContractTransposeX1d(SharedData_Hip &data, const CeedScalar *U, const CeedSc… in ContractTransposeX1d() 52 inline __device__ void Interp1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const Cee… in Interp1d() 62 inline __device__ void InterpTranspose1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, … in InterpTranspose1d() 73 inline __device__ void InterpCollocatedNodes1d(SharedData_Hip &data, const CeedScalar *__restrict__… in InterpCollocatedNodes1d() 84 inline __device__ void InterpTransposeCollocatedNodes1d(SharedData_Hip &data, const CeedScalar *__r… in InterpTransposeCollocatedNodes1d() 95 inline __device__ void Grad1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedS… in Grad1d() 106 inline __device__ void GradTranspose1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, co… in GradTranspose1d() 117 inline __device__ void Weight1d(SharedData_Hip &data, const CeedScalar *__restrict__ q_weight_1d, C… in Weight1d() 129 inline __device__ void ContractX2d(SharedData_Hip &data, const CeedScalar *U, const CeedScalar *B, … in ContractX2d() [all …]
|
| H A D | hip-shared-basis-tensor.h | 22 SharedData_Hip data; in __launch_bounds__() local 61 SharedData_Hip data; in __launch_bounds__() local 91 SharedData_Hip data; in __launch_bounds__() local 130 SharedData_Hip data; in __launch_bounds__() local 160 SharedData_Hip data; in __launch_bounds__() local 200 SharedData_Hip data; in __launch_bounds__() local 233 SharedData_Hip data; in __launch_bounds__() local 277 SharedData_Hip data; in __launch_bounds__() local 318 SharedData_Hip data; in __launch_bounds__() local 362 SharedData_Hip data; in __launch_bounds__() local [all …]
|
| H A D | hip-shared-basis-nontensor-templates.h | 16 inline __device__ void Contract1d(SharedData_Hip &data, const CeedScalar *U, const CeedScalar *B, C… in Contract1d() 32 inline __device__ void ContractTranspose1d(SharedData_Hip &data, const CeedScalar *U, const CeedSca… in ContractTranspose1d() 47 inline __device__ void InterpNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, co… in InterpNonTensor() 58 inline __device__ void InterpTransposeNonTensor(SharedData_Hip &data, const CeedScalar *__restrict_… in InterpTransposeNonTensor() 70 inline __device__ void GradNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, cons… in GradNonTensor() 82 inline __device__ void GradTransposeNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ … in GradTransposeNonTensor() 96 inline __device__ void WeightNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ q_weigh… in WeightNonTensor()
|
| H A D | hip-shared-basis-nontensor.h | 22 SharedData_Hip data; in __launch_bounds__() local 49 SharedData_Hip data; in __launch_bounds__() local 76 SharedData_Hip data; in __launch_bounds__() local 106 SharedData_Hip data; in __launch_bounds__() local 133 SharedData_Hip data; in __launch_bounds__() local 160 SharedData_Hip data; in __launch_bounds__() local 190 SharedData_Hip data; in __launch_bounds__() local
|
| H A D | hip-shared-basis-tensor-flattened-templates.h | 20 inline __device__ void ContractX2dFlattened(SharedData_Hip &data, const int t_id_x, const int t_id_… in ContractX2dFlattened() 37 inline __device__ void ContractY2dFlattened(SharedData_Hip &data, const int t_id_x, const int t_id_… in ContractY2dFlattened() 54 inline __device__ void ContractTransposeY2dFlattened(SharedData_Hip &data, const int t_id_x, const … in ContractTransposeY2dFlattened() 71 inline __device__ void ContractTransposeX2dFlattened(SharedData_Hip &data, const int t_id_x, const … in ContractTransposeX2dFlattened() 88 inline __device__ void ContractTransposeAddX2dFlattened(SharedData_Hip &data, const int t_id_x, con… in ContractTransposeAddX2dFlattened() 104 inline __device__ void QPack2d(SharedData_Hip &data, const int t_id_x, const int t_id_y, CeedScalar… in QPack2d() 116 inline __device__ void QUnpack2d(SharedData_Hip &data, const int t_id_x, const int t_id_y, CeedScal… in QUnpack2d() 131 inline __device__ void InterpTensor2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, … in InterpTensor2dFlattened() 150 inline __device__ void InterpTransposeTensor2dFlattened(SharedData_Hip &data, CeedScalar *__restric… in InterpTransposeTensor2dFlattened() 168 inline __device__ void InterpTensorCollocatedNodes2dFlattened(SharedData_Hip &data, CeedScalar *__r… in InterpTensorCollocatedNodes2dFlattened() [all …]
|
| H A D | hip-gen-templates.h | 16 inline __device__ void LoadMatrix(SharedData_Hip &data, const CeedScalar *__restrict__ d_B, CeedSca… in LoadMatrix() 28 inline __device__ void ReadPoint(SharedData_Hip &data, const CeedInt elem, const CeedInt p, const C… in ReadPoint() 41 inline __device__ void WritePoint(SharedData_Hip &data, const CeedInt elem, const CeedInt p, const … in WritePoint() 60 inline __device__ void SetEVecStandard1d_Single(SharedData_Hip &data, const CeedInt n, const CeedSc… in SetEVecStandard1d_Single() 73 inline __device__ void ReadLVecStandard1d(SharedData_Hip &data, const CeedInt num_nodes, const Ceed… in ReadLVecStandard1d() 87 inline __device__ void ReadLVecStrided1d(SharedData_Hip &data, const CeedInt elem, const CeedScalar… in ReadLVecStrided1d() 100 inline __device__ void WriteLVecStandard1d(SharedData_Hip &data, const CeedInt num_nodes, const Cee… in WriteLVecStandard1d() 111 inline __device__ void WriteLVecStandard1d_Single(SharedData_Hip &data, const CeedInt num_nodes, co… in WriteLVecStandard1d_Single() 128 inline __device__ void WriteLVecStandard1d_Assembly(SharedData_Hip &data, const CeedInt num_nodes, … in WriteLVecStandard1d_Assembly() 147 inline __device__ void WriteLVecStandard1d_QFAssembly(SharedData_Hip &data, const CeedInt num_elem,… in WriteLVecStandard1d_QFAssembly() [all …]
|
| H A D | hip-shared-basis-read-write-templates.h | 16 inline __device__ void LoadMatrix(SharedData_Hip &data, const CeedScalar *__restrict__ d_B, CeedSca… in LoadMatrix() 28 inline __device__ void ReadElementStrided1d(SharedData_Hip &data, const CeedInt elem, const CeedInt… in ReadElementStrided1d() 44 inline __device__ void WriteElementStrided1d(SharedData_Hip &data, const CeedInt elem, const CeedIn… in WriteElementStrided1d() 57 inline __device__ void SumElementStrided1d(SharedData_Hip &data, const CeedInt elem, const CeedInt … in SumElementStrided1d() 77 inline __device__ void ReadElementStrided2d(SharedData_Hip &data, const CeedInt elem, const CeedInt… in ReadElementStrided2d() 93 inline __device__ void WriteElementStrided2d(SharedData_Hip &data, const CeedInt elem, const CeedIn… in WriteElementStrided2d() 106 inline __device__ void SumElementStrided2d(SharedData_Hip &data, const CeedInt elem, const CeedInt … in SumElementStrided2d() 126 inline __device__ void ReadElementStrided3d(SharedData_Hip &data, const CeedInt elem, const CeedInt… in ReadElementStrided3d() 144 inline __device__ void WriteElementStrided3d(SharedData_Hip &data, const CeedInt elem, const CeedIn… in WriteElementStrided3d() 159 inline __device__ void SumElementStrided3d(SharedData_Hip &data, const CeedInt elem, const CeedInt … in SumElementStrided3d() [all …]
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-qfunction.c | 25 CeedQFunction_Cuda *data; in CeedQFunctionApply_Cuda() local 69 CeedQFunction_Cuda *data; in CeedQFunctionDestroy_Cuda() local 81 CeedQFunction_Cuda *data; in CeedQFunctionSetCUDAUserFunction_Cuda() local 93 CeedQFunction_Cuda *data; in CeedQFunctionCreate_Cuda() local
|
| H A D | ceed-cuda-ref-qfunctioncontext.c | 150 …ContextSetDataHost_Cuda(const CeedQFunctionContext ctx, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetDataHost_Cuda() 181 …ntextSetDataDevice_Cuda(const CeedQFunctionContext ctx, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetDataDevice_Cuda() 218 …t CeedQFunctionContext ctx, const CeedMemType mem_type, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetData_Cuda() 232 …ctionContextTakeData_Cuda(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextTakeData_Cuda() 262 …onContextGetDataCore_Cuda(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetDataCore_Cuda() 287 …onContextGetDataRead_Cuda(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetDataRead_Cuda() 294 …nctionContextGetData_Cuda(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetData_Cuda()
|
| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-qfunctioncontext.c | 149 …nContextSetDataHost_Hip(const CeedQFunctionContext ctx, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetDataHost_Hip() 180 …ontextSetDataDevice_Hip(const CeedQFunctionContext ctx, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetDataDevice_Hip() 217 …t CeedQFunctionContext ctx, const CeedMemType mem_type, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetData_Hip() 231 …nctionContextTakeData_Hip(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextTakeData_Hip() 261 …ionContextGetDataCore_Hip(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetDataCore_Hip() 286 …ionContextGetDataRead_Hip(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetDataRead_Hip() 293 …unctionContextGetData_Hip(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetData_Hip()
|
| H A D | ceed-hip-ref-qfunction.c | 25 CeedQFunction_Hip *data; in CeedQFunctionApply_Hip() local 71 CeedQFunction_Hip *data; in CeedQFunctionDestroy_Hip() local 85 CeedQFunction_Hip *data; in CeedQFunctionCreate_Hip() local
|
| /libCEED/backends/magma/ |
| H A D | ceed-magma-common.c | 19 Ceed_Magma *data; in CeedInit_Magma_common() local 46 Ceed_Magma *data; in CeedDestroy_Magma() local
|
| /libCEED/backends/opt/ |
| H A D | ceed-opt-blocked.c | 19 Ceed_Opt *data; in CeedDestroy_Opt() local 31 Ceed_Opt *data; in CeedInit_Opt_Blocked() local
|
| H A D | ceed-opt-serial.c | 19 Ceed_Opt *data; in CeedDestroy_Opt() local 31 Ceed_Opt *data; in CeedInit_Opt_Serial() local
|
| /libCEED/backends/sycl/ |
| H A D | ceed-sycl-common.sycl.cpp | 19 Ceed_Sycl *data; in CeedInit_Sycl() local 82 Ceed_Sycl *data; in CeedDestroy_Sycl() local 94 Ceed_Sycl *data; in CeedSetStream_Sycl() local
|
| /libCEED/backends/sycl-ref/ |
| H A D | ceed-sycl-ref-qfunctioncontext.sycl.cpp | 161 …ContextSetDataHost_Sycl(const CeedQFunctionContext ctx, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetDataHost_Sycl() 192 …ntextSetDataDevice_Sycl(const CeedQFunctionContext ctx, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetDataDevice_Sycl() 242 …t CeedQFunctionContext ctx, const CeedMemType mem_type, const CeedCopyMode copy_mode, void *data) { in CeedQFunctionContextSetData_Sycl() 256 …ctionContextTakeData_Sycl(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextTakeData_Sycl() 294 …onContextGetDataCore_Sycl(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetDataCore_Sycl() 319 …onContextGetDataRead_Sycl(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetDataRead_Sycl() 326 …nctionContextGetData_Sycl(const CeedQFunctionContext ctx, const CeedMemType mem_type, void *data) { in CeedQFunctionContextGetData_Sycl()
|
| /libCEED/backends/hip-gen/ |
| H A D | ceed-hip-gen-qfunction.c | 26 CeedQFunction_Hip_gen *data; in CeedQFunctionDestroy_Hip_gen() local 39 CeedQFunction_Hip_gen *data; in CeedQFunctionCreate_Hip_gen() local
|
| /libCEED/backends/cuda-gen/ |
| H A D | ceed-cuda-gen-qfunction.c | 26 CeedQFunction_Cuda_gen *data; in CeedQFunctionDestroy_Cuda_gen() local 39 CeedQFunction_Cuda_gen *data; in CeedQFunctionCreate_Cuda_gen() local
|