| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-shared-basis-tensor.h | 18 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *… in Interp() 56 extern "C" __global__ void InterpCollocated(const CeedInt num_elem, const CeedScalar *c_B, const Ce… in InterpCollocated() 86 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpTranspose() 125 extern "C" __global__ void InterpCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B,… in InterpCollocatedTranspose() 155 extern "C" __global__ void InterpTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const … in InterpTransposeAdd() 194 …lobal__ void InterpCollocatedTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpCollocatedTransposeAdd() 227 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_… in Grad() 270 extern "C" __global__ void GradCollocated(const CeedInt num_elem, const CeedScalar *c_B, const Ceed… in GradCollocated() 310 extern "C" __global__ void GradTranspose(const CeedInt num_elem, const CeedScalar *c_B, const CeedS… in GradTranspose() 353 extern "C" __global__ void GradCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B, c… in GradCollocatedTranspose() [all …]
|
| H A D | cuda-shared-basis-tensor-templates.h | 52 …terp1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, CeedScala… in Interp1d() 62 …InterpTranspose1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTranspose1d() 73 …CollocatedNodes1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpCollocatedNodes1d() 84 …CollocatedNodes1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeCollocatedNodes1d() 95 …Grad1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const Cee… in Grad1d() 106 …pose1d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const Cee… in GradTranspose1d() 208 …id InterpTensor2d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensor2d() 221 …TransposeTensor2d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensor2d() 234 …CollocatedNodes2d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensorCollocatedNodes2d() 245 …CollocatedNodes2d(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensorCollocatedNodes2d() [all …]
|
| H A D | cuda-shared-basis-tensor-flattened-templates.h | 131 …InterpTensor2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensor2dFlattened() 150 …nsposeTensor2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensor2dFlattened() 168 …locatedNodes2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensorCollocatedNodes2dFlattened() 185 …locatedNodes2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensorCollocatedNodes2dFlattened() 201 …r2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const Cee… in GradTensor2dFlattened() 222 …nsposeTensor2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in GradTransposeTensor2dFlattened() 242 …locatedNodes2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in GradTensorCollocatedNodes2dFlattened() 260 …locatedNodes2dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in GradTransposeTensorCollocatedNodes2dFlattened() 468 …InterpTensor3dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensor3dFlattened() 488 …nsposeTensor3dFlattened(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensor3dFlattened() [all …]
|
| H A D | cuda-shared-basis-tensor-at-points.h | 23 …"C" __global__ void InterpAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B, con… in InterpAtPoints() 78 …__global__ void InterpTransposeAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B, in InterpTransposeAtPoints() 148 …lobal__ void InterpTransposeAddAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B, in InterpTransposeAddAtPoints() 210 extern "C" __global__ void GradAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B,… in GradAtPoints() 265 …" __global__ void GradTransposeAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B, in GradTransposeAtPoints() 336 …_global__ void GradTransposeAddAtPoints(const CeedInt num_elem, const CeedScalar *__restrict__ c_B, in GradTransposeAddAtPoints()
|
| H A D | cuda-shared-basis-nontensor.h | 18 extern "C" __global__ void Interp(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *… in Interp() 44 extern "C" __global__ void InterpTranspose(const CeedInt num_elem, const CeedScalar *c_B, const Cee… in InterpTranspose() 71 extern "C" __global__ void InterpTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const … in InterpTransposeAdd()
|
| H A D | cuda-shared-basis-nontensor-templates.h | 47 …d InterpNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpNonTensor() 58 …ransposeNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeNonTensor()
|
| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-shared-basis-tensor-templates.h | 52 …nterp1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, CeedScala… in Interp1d() 62 … InterpTranspose1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTranspose1d() 73 …pCollocatedNodes1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpCollocatedNodes1d() 84 …eCollocatedNodes1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeCollocatedNodes1d() 95 … Grad1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const Cee… in Grad1d() 106 …spose1d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const Cee… in GradTranspose1d() 208 …ensor2d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, CeedScala… in InterpTensor2d() 220 …pTransposeTensor2d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensor2d() 233 …rCollocatedNodes2d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensorCollocatedNodes2d() 244 …rCollocatedNodes2d(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensorCollocatedNodes2d() [all …]
|
| H A D | hip-shared-basis-tensor-flattened-templates.h | 131 … InterpTensor2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensor2dFlattened() 150 …ansposeTensor2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensor2dFlattened() 168 …llocatedNodes2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensorCollocatedNodes2dFlattened() 185 …llocatedNodes2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensorCollocatedNodes2dFlattened() 201 …or2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const Cee… in GradTensor2dFlattened() 222 …ansposeTensor2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in GradTransposeTensor2dFlattened() 242 …llocatedNodes2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in GradTensorCollocatedNodes2dFlattened() 260 …llocatedNodes2dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in GradTransposeTensorCollocatedNodes2dFlattened() 468 … InterpTensor3dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTensor3dFlattened() 488 …ansposeTensor3dFlattened(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeTensor3dFlattened() [all …]
|
| H A D | hip-shared-basis-nontensor-templates.h | 47 …id InterpNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpNonTensor() 58 …TransposeNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, in InterpTransposeNonTensor()
|