| /libCEED/include/ceed/jit-source/sycl/ |
| H A D | sycl-shared-basis-tensor.h | 24 local CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in Interp() local 33 loadMatrix(BASIS_P_1D * BASIS_Q_1D, d_interp_1d, s_B); in Interp() 38 Interp1d(BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, r_U, s_B, r_V, elem_scratch); in Interp() 43 InterpTensor2d(BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, r_U, s_B, r_V, elem_scratch); in Interp() 48 InterpTensor3d(BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, r_U, s_B, r_V, elem_scratch); in Interp() 58 local CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in InterpTranspose() local 67 loadMatrix(BASIS_P_1D * BASIS_Q_1D, d_interp_1d, s_B); in InterpTranspose() 72 InterpTranspose1d(BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, r_U, s_B, r_V, elem_scratch); in InterpTranspose() 77 InterpTransposeTensor2d(BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, r_U, s_B, r_V, elem_scratch); in InterpTranspose() 82 InterpTransposeTensor3d(BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, r_U, s_B, r_V, elem_scratch); in InterpTranspose() [all …]
|
| H A D | sycl-shared-basis-tensor-templates.h | 58 …local const CeedScalar *restrict s_B, private CeedScalar *restrict r_V, local CeedScalar *restrict… in Interp1d() argument 60 ContractX1d(P_1D, Q_1D, r_U + comp, s_B, r_V + comp, scratch); in Interp1d() 68 …local const CeedScalar *restrict s_B, private CeedScalar *restrict r_V, local CeedScalar *restrict… in InterpTranspose1d() argument 70 ContractTransposeX1d(P_1D, Q_1D, r_U + comp, s_B, r_V + comp, scratch); in InterpTranspose1d() 209 …local const CeedScalar *restrict s_B, private CeedScalar *restrict r_V, local CeedScalar *restrict… in InterpTensor2d() argument 213 ContractX2d(P_1D, Q_1D, r_U + comp, s_B, r_t, scratch); in InterpTensor2d() 214 ContractY2d(P_1D, Q_1D, r_t, s_B, r_V + comp, scratch); in InterpTensor2d() 222 …local const CeedScalar *restrict s_B, private CeedScalar *restrict r_V, local CeedScalar *restrict… in InterpTransposeTensor2d() argument 226 ContractTransposeY2d(P_1D, Q_1D, r_U + comp, s_B, r_t, scratch); in InterpTransposeTensor2d() 227 ContractTransposeX2d(P_1D, Q_1D, r_t, s_B, r_V + comp, scratch); in InterpTransposeTensor2d() [all …]
|
| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-shared-basis-tensor-at-points.h | 40 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in InterpAtPoints() local 41 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in InterpAtPoints() 49 Interp1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_C); in InterpAtPoints() 52 InterpTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_C); in InterpAtPoints() 56 InterpTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_C); in InterpAtPoints() 96 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in InterpTransposeAtPoints() local 97 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in InterpTransposeAtPoints() 135 InterpTranspose1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_C, s_B, r_V); in InterpTransposeAtPoints() 138 … InterpTransposeTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_C, s_B, r_V); in InterpTransposeAtPoints() 141 … InterpTransposeTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_C, s_B, r_V); in InterpTransposeAtPoints() [all …]
|
| H A D | cuda-shared-basis-tensor.h | 32 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in Interp() local 33 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in Interp() 40 Interp1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in Interp() 44 InterpTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in Interp() 49 InterpTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in Interp() 101 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in InterpTranspose() local 102 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in InterpTranspose() 109 InterpTranspose1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in InterpTranspose() 113 … InterpTransposeTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in InterpTranspose() 118 … InterpTransposeTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in InterpTranspose() [all …]
|
| H A D | cuda-shared-basis-nontensor.h | 32 __shared__ CeedScalar s_B[BASIS_P * BASIS_Q]; in Interp() local 33 LoadMatrix<BASIS_P, BASIS_Q>(data, c_B, s_B); in Interp() 39 InterpNonTensor<BASIS_NUM_COMP, BASIS_P, BASIS_Q, BASIS_T_1D>(data, r_U, s_B, r_V); in Interp() 59 __shared__ CeedScalar s_B[BASIS_P * BASIS_Q]; in InterpTranspose() local 60 LoadMatrix<BASIS_P, BASIS_Q>(data, c_B, s_B); in InterpTranspose() 66 InterpTransposeNonTensor<BASIS_NUM_COMP, BASIS_P, BASIS_Q, BASIS_T_1D>(data, r_U, s_B, r_V); in InterpTranspose() 86 __shared__ CeedScalar s_B[BASIS_P * BASIS_Q]; in InterpTransposeAdd() local 87 LoadMatrix<BASIS_P, BASIS_Q>(data, c_B, s_B); in InterpTransposeAdd() 93 InterpTransposeNonTensor<BASIS_NUM_COMP, BASIS_P, BASIS_Q, BASIS_T_1D>(data, r_U, s_B, r_V); in InterpTransposeAdd()
|
| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-shared-basis-tensor-at-points.h | 41 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in __launch_bounds__() local 42 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in __launch_bounds__() 50 Interp1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_C); in __launch_bounds__() 53 InterpTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_C); in __launch_bounds__() 57 InterpTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_C); in __launch_bounds__() 97 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in __launch_bounds__() local 98 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in __launch_bounds__() 136 InterpTranspose1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_C, s_B, r_V); in __launch_bounds__() 139 … InterpTransposeTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_C, s_B, r_V); in __launch_bounds__() 142 … InterpTransposeTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_C, s_B, r_V); in __launch_bounds__() [all …]
|
| H A D | hip-shared-basis-tensor.h | 33 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in __launch_bounds__() local 34 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in __launch_bounds__() 41 Interp1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 45 InterpTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 50 InterpTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 102 __shared__ CeedScalar s_B[BASIS_P_1D * BASIS_Q_1D]; in __launch_bounds__() local 103 LoadMatrix<BASIS_P_1D, BASIS_Q_1D>(data, c_B, s_B); in __launch_bounds__() 110 InterpTranspose1d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 114 … InterpTransposeTensor2d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 119 … InterpTransposeTensor3d<BASIS_NUM_COMP, BASIS_P_1D, BASIS_Q_1D, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() [all …]
|
| H A D | hip-shared-basis-nontensor.h | 33 __shared__ CeedScalar s_B[BASIS_P * BASIS_Q]; in __launch_bounds__() local 34 LoadMatrix<BASIS_P, BASIS_Q>(data, c_B, s_B); in __launch_bounds__() 40 InterpNonTensor<BASIS_NUM_COMP, BASIS_P, BASIS_Q, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 60 __shared__ CeedScalar s_B[BASIS_P * BASIS_Q]; in __launch_bounds__() local 61 LoadMatrix<BASIS_P, BASIS_Q>(data, c_B, s_B); in __launch_bounds__() 67 InterpTransposeNonTensor<BASIS_NUM_COMP, BASIS_P, BASIS_Q, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__() 87 __shared__ CeedScalar s_B[BASIS_P * BASIS_Q]; in __launch_bounds__() local 88 LoadMatrix<BASIS_P, BASIS_Q>(data, c_B, s_B); in __launch_bounds__() 94 InterpTransposeNonTensor<BASIS_NUM_COMP, BASIS_P, BASIS_Q, BASIS_T_1D>(data, r_U, s_B, r_V); in __launch_bounds__()
|