| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-shared-basis-tensor.h | 227 …global__ void Grad(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_G, const Cee… in Grad() 270 …oid GradCollocated(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_G, const Cee… in GradCollocated() 310 …void GradTranspose(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_G, const Cee… in GradTranspose() 353 … void GradCollocatedTranspose(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_G, in GradCollocatedTranspose() 393 …d GradTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_G, const Cee… in GradTransposeAdd() 436 …id GradCollocatedTransposeAdd(const CeedInt num_elem, const CeedScalar *c_B, const CeedScalar *c_G, in GradCollocatedTransposeAdd()
|
| H A D | cuda-shared-basis-tensor-templates.h | 95 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in Grad1d() 106 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTranspose1d() 256 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor2d() 271 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTransposeTensor2d() 287 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocatedNodes2d() 299 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocatedNodes2d() 544 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor3d() 565 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTransposeTensor3d() 586 …dData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensorCollocated3d() 605 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocated3d() [all …]
|
| H A D | cuda-shared-basis-nontensor.h | 101 extern "C" __global__ void Grad(const CeedInt num_elem, const CeedScalar *c_G, const CeedScalar *__… in Grad() 127 extern "C" __global__ void GradTranspose(const CeedInt num_elem, const CeedScalar *c_G, const CeedS… in GradTranspose() 154 extern "C" __global__ void GradTransposeAdd(const CeedInt num_elem, const CeedScalar *c_G, const Ce… in GradTransposeAdd()
|
| H A D | cuda-shared-basis-nontensor-templates.h | 70 …Tensor(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, CeedScala… in GradNonTensor() 82 …ransposeNonTensor(SharedData_Cuda &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, in GradTransposeNonTensor()
|
| H A D | cuda-shared-basis-tensor-flattened-templates.h | 201 …(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor2dFlattened() 223 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensor2dFlattened() 243 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocatedNodes2dFlattened() 261 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocatedNodes2dFlattened() 540 …(SharedData_Cuda &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor3dFlattened() 567 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensor3dFlattened() 592 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocated3dFlattened() 615 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensor3dFlattened() 640 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocatedNodes3dFlattened() 659 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocatedNodes3dFlattened()
|
| H A D | cuda-gen-templates.h | 479 …(SharedData_Cuda &data, const CeedInt q, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, in GradColloSlice3d() 509 …(SharedData_Cuda &data, const CeedInt q, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, in GradColloSliceTranspose3d()
|
| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-shared-basis-tensor-templates.h | 95 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in Grad1d() 106 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTranspose1d() 255 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor2d() 270 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTransposeTensor2d() 286 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocatedNodes2d() 298 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocatedNodes2d() 542 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor3d() 563 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTransposeTensor3d() 584 …edData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensorCollocated3d() 603 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocated3d() [all …]
|
| H A D | hip-shared-basis-nontensor-templates.h | 70 …nTensor(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, CeedScala… in GradNonTensor() 82 …TransposeNonTensor(SharedData_Hip &data, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, in GradTransposeNonTensor()
|
| H A D | hip-shared-basis-tensor-flattened-templates.h | 201 …d(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor2dFlattened() 223 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensor2dFlattened() 243 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocatedNodes2dFlattened() 261 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocatedNodes2dFlattened() 540 …d(SharedData_Hip &data, CeedScalar *__restrict__ r_U, const CeedScalar *c_B, const CeedScalar *c_G, in GradTensor3dFlattened() 567 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensor3dFlattened() 592 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocated3dFlattened() 615 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocated3dFlattened() 637 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTensorCollocatedNodes3dFlattened() 656 … const CeedScalar *c_G, CeedScalar *__restrict__ r_V) { in GradTransposeTensorCollocatedNodes3dFlattened()
|
| H A D | hip-gen-templates.h | 476 …d(SharedData_Hip &data, const CeedInt q, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, in GradColloSlice3d() 506 …d(SharedData_Hip &data, const CeedInt q, const CeedScalar *__restrict__ r_U, const CeedScalar *c_G, in GradColloSliceTranspose3d()
|