| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-gen-templates.h | 59 template <int NUM_COMP, int P_1D> 61 const CeedInt target_comp = n / P_1D; in SetEVecStandard1d_Single() 62 const CeedInt target_node = n % P_1D; in SetEVecStandard1d_Single() 72 template <int NUM_COMP, int COMP_STRIDE, int P_1D> 75 if (data.t_id_x < P_1D) { in ReadLVecStandard1d() 77 const CeedInt ind = indices[node + elem * P_1D]; in ReadLVecStandard1d() 86 template <int NUM_COMP, int P_1D, int STRIDES_NODE, int STRIDES_COMP, int STRIDES_ELEM> 88 if (data.t_id_x < P_1D) { in ReadLVecStrided1d() 99 template <int NUM_COMP, int COMP_STRIDE, int P_1D> 102 if (data.t_id_x < P_1D) { in WriteLVecStandard1d() [all …]
|
| H A D | hip-shared-basis-tensor-templates.h | 19 template <int NUM_COMP, int P_1D, int Q_1D> 26 for (CeedInt i = 0; i < P_1D; i++) { in ContractX1d() 27 *V += B[i + data.t_id_x * P_1D] * data.slice[i]; // Contract x direction in ContractX1d() 35 template <int NUM_COMP, int P_1D, int Q_1D> 41 if (data.t_id_x < P_1D) { in ContractTransposeX1d() 43 *V += B[data.t_id_x + i * P_1D] * data.slice[i]; // Contract x direction in ContractTransposeX1d() 51 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 54 ContractX1d<NUM_COMP, P_1D, Q_1D>(data, &r_U[comp], c_B, &r_V[comp]); in Interp1d() 61 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 65 ContractTransposeX1d<NUM_COMP, P_1D, Q_1D>(data, &r_U[comp], c_B, &r_V[comp]); in InterpTranspose1d() [all …]
|
| H A D | hip-shared-basis-read-write-templates.h | 27 template <int NUM_COMP, int P_1D> 30 if (data.t_id_x < P_1D) { in ReadElementStrided1d() 43 template <int NUM_COMP, int P_1D> 46 if (data.t_id_x < P_1D) { in WriteElementStrided1d() 56 template <int NUM_COMP, int P_1D> 59 if (data.t_id_x < P_1D) { in SumElementStrided1d() 76 template <int NUM_COMP, int P_1D> 79 if (data.t_id_x < P_1D && data.t_id_y < P_1D) { in ReadElementStrided2d() 80 const CeedInt node = data.t_id_x + data.t_id_y * P_1D; in ReadElementStrided2d() 92 template <int NUM_COMP, int P_1D> [all …]
|
| H A D | hip-shared-basis-tensor-flattened-templates.h | 19 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 26 if (t_id_x < Q_1D && t_id_y < P_1D) { in ContractX2dFlattened() 27 for (CeedInt i = 0; i < P_1D; i++) { in ContractX2dFlattened() 28 *V += B[i + t_id_x * P_1D] * data.slice[i + t_id_y * T_1D]; // Contract x direction in ContractX2dFlattened() 36 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 44 for (CeedInt i = 0; i < P_1D; i++) { in ContractY2dFlattened() 45 *V += B[i + t_id_y * P_1D] * data.slice[t_id_x + i * T_1D]; // Contract y direction in ContractY2dFlattened() 53 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 60 if (t_id_x < Q_1D && t_id_y < P_1D) { in ContractTransposeY2dFlattened() 62 *V += B[t_id_y + i * P_1D] * data.slice[t_id_x + i * T_1D]; // Contract y direction in ContractTransposeY2dFlattened() [all …]
|
| H A D | hip-shared-basis-nontensor-templates.h | 15 template <int NUM_COMP, int P_1D, int Q_1D> 21 for (CeedInt i = 0; i < P_1D; i++) { in Contract1d() 22 *V += B[i + data.t_id_x * P_1D] * data.slice[i]; // Contract x direction in Contract1d() 31 template <int NUM_COMP, int P_1D, int Q_1D> 35 if (data.t_id_x < P_1D) { in ContractTranspose1d() 37 *V += B[data.t_id_x + i * P_1D] * data.slice[i]; // Contract x direction in ContractTranspose1d()
|
| H A D | hip-shared-basis-tensor-at-points-templates.h | 43 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 65 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 90 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 112 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 141 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 172 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 210 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 245 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 291 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 328 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> [all …]
|
| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-gen-templates.h | 59 template <int NUM_COMP, int P_1D> 61 const CeedInt target_comp = n / P_1D; in SetEVecStandard1d_Single() 62 const CeedInt target_node = n % P_1D; in SetEVecStandard1d_Single() 72 template <int NUM_COMP, int COMP_STRIDE, int P_1D> 75 if (data.t_id_x < P_1D) { in ReadLVecStandard1d() 77 const CeedInt ind = indices[node + elem * P_1D]; in ReadLVecStandard1d() 86 template <int NUM_COMP, int P_1D, int STRIDES_NODE, int STRIDES_COMP, int STRIDES_ELEM> 89 if (data.t_id_x < P_1D) { in ReadLVecStrided1d() 100 template <int NUM_COMP, int COMP_STRIDE, int P_1D> 103 if (data.t_id_x < P_1D) { in WriteLVecStandard1d() [all …]
|
| H A D | cuda-shared-basis-tensor-templates.h | 19 template <int NUM_COMP, int P_1D, int Q_1D> 26 for (CeedInt i = 0; i < P_1D; i++) { in ContractX1d() 27 *V += B[i + data.t_id_x * P_1D] * data.slice[i]; // Contract x direction in ContractX1d() 35 template <int NUM_COMP, int P_1D, int Q_1D> 41 if (data.t_id_x < P_1D) { in ContractTransposeX1d() 43 *V += B[data.t_id_x + i * P_1D] * data.slice[i]; // Contract x direction in ContractTransposeX1d() 51 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 54 ContractX1d<NUM_COMP, P_1D, Q_1D>(data, &r_U[comp], c_B, &r_V[comp]); in Interp1d() 61 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 65 ContractTransposeX1d<NUM_COMP, P_1D, Q_1D>(data, &r_U[comp], c_B, &r_V[comp]); in InterpTranspose1d() [all …]
|
| H A D | cuda-shared-basis-read-write-templates.h | 27 template <int NUM_COMP, int P_1D> 30 if (data.t_id_x < P_1D) { in ReadElementStrided1d() 43 template <int NUM_COMP, int P_1D> 46 if (data.t_id_x < P_1D) { in WriteElementStrided1d() 56 template <int NUM_COMP, int P_1D> 59 if (data.t_id_x < P_1D) { in SumElementStrided1d() 76 template <int NUM_COMP, int P_1D> 79 if (data.t_id_x < P_1D && data.t_id_y < P_1D) { in ReadElementStrided2d() 80 const CeedInt node = data.t_id_x + data.t_id_y * P_1D; in ReadElementStrided2d() 92 template <int NUM_COMP, int P_1D> [all …]
|
| H A D | cuda-shared-basis-tensor-flattened-templates.h | 19 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 26 if (t_id_x < Q_1D && t_id_y < P_1D) { in ContractX2dFlattened() 27 for (CeedInt i = 0; i < P_1D; i++) { in ContractX2dFlattened() 28 *V += B[i + t_id_x * P_1D] * data.slice[i + t_id_y * T_1D]; // Contract x direction in ContractX2dFlattened() 36 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 44 for (CeedInt i = 0; i < P_1D; i++) { in ContractY2dFlattened() 45 *V += B[i + t_id_y * P_1D] * data.slice[t_id_x + i * T_1D]; // Contract y direction in ContractY2dFlattened() 53 template <int NUM_COMP, int P_1D, int Q_1D, int T_1D> 60 if (t_id_x < Q_1D && t_id_y < P_1D) { in ContractTransposeY2dFlattened() 62 *V += B[t_id_y + i * P_1D] * data.slice[t_id_x + i * T_1D]; // Contract y direction in ContractTransposeY2dFlattened() [all …]
|
| H A D | cuda-shared-basis-nontensor-templates.h | 15 template <int NUM_COMP, int P_1D, int Q_1D> 21 for (CeedInt i = 0; i < P_1D; i++) { in Contract1d() 22 *V += B[i + data.t_id_x * P_1D] * data.slice[i]; // Contract x direction in Contract1d() 31 template <int NUM_COMP, int P_1D, int Q_1D> 35 if (data.t_id_x < P_1D) { in ContractTranspose1d() 37 *V += B[data.t_id_x + i * P_1D] * data.slice[i]; // Contract x direction in ContractTranspose1d()
|
| H A D | cuda-shared-basis-tensor-at-points-templates.h | 43 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 64 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 89 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 111 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 140 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 171 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 209 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 244 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 290 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> 327 template <int NUM_COMP, int NUM_POINTS, int P_1D, int Q_1D> [all …]
|
| /libCEED/include/ceed/jit-source/sycl/ |
| H A D | sycl-shared-basis-tensor-templates.h | 19 inline void ContractX1d(const CeedInt P_1D, const CeedInt Q_1D, private const CeedScalar *restrict … in ContractX1d() argument 28 for (CeedInt i = 0; i < P_1D; i++) { in ContractX1d() 29 *V += B[i + item_id_x * P_1D] * scratch[i]; // Contract x direction in ContractX1d() 38 inline void ContractTransposeX1d(const CeedInt P_1D, const CeedInt Q_1D, private const CeedScalar *… in ContractTransposeX1d() argument 46 if (item_id_x < P_1D) { in ContractTransposeX1d() 48 *V += B[item_id_x + i * P_1D] * scratch[i]; // Contract x direction in ContractTransposeX1d() 57 inline void Interp1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt Q_1D, private const … in Interp1d() argument 60 ContractX1d(P_1D, Q_1D, r_U + comp, s_B, r_V + comp, scratch); in Interp1d() 67 inline void InterpTranspose1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt Q_1D, priva… in InterpTranspose1d() argument 70 ContractTransposeX1d(P_1D, Q_1D, r_U + comp, s_B, r_V + comp, scratch); in InterpTranspose1d() [all …]
|
| H A D | sycl-shared-basis-read-write-templates.h | 28 inline void ReadElementStrided1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem… in ReadElementStrided1d() argument 34 if (item_id_x < P_1D && elem < num_elem) { in ReadElementStrided1d() 46 inline void WriteElementStrided1d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_ele… in WriteElementStrided1d() argument 52 if (item_id_x < P_1D && elem < num_elem) { in WriteElementStrided1d() 68 inline void ReadElementStrided2d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_elem… in ReadElementStrided2d() argument 75 if (item_id_x < P_1D && item_id_y < P_1D && elem < num_elem) { in ReadElementStrided2d() 76 const CeedInt node = item_id_x + item_id_y * P_1D; in ReadElementStrided2d() 87 inline void WriteElementStrided2d(const CeedInt NUM_COMP, const CeedInt P_1D, const CeedInt num_ele… in WriteElementStrided2d() argument 94 if (item_id_x < P_1D && item_id_y < P_1D && elem < num_elem) { in WriteElementStrided2d() 95 const CeedInt node = item_id_x + item_id_y * P_1D; in WriteElementStrided2d() [all …]
|
| H A D | sycl-gen-templates.h | 33 inline void readDofsOffset1d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D… in readDofsOffset1d() argument 38 if (item_id_x < P_1D && elem < num_elem) { in readDofsOffset1d() 40 const CeedInt ind = indices[node + elem * P_1D]; in readDofsOffset1d() 50 inline void readDofsStrided1d(const CeedInt num_comp, const CeedInt P_1D, const CeedInt strides_nod… in readDofsStrided1d() argument 56 if (item_id_x < P_1D && elem < num_elem) { in readDofsStrided1d() 68 …ffset1d(const CeedInt num_comp, const CeedInt strides_comp, const CeedInt P_1D, const CeedInt num_… in writeDofsOffset1d() argument 73 if (item_id_x < P_1D && elem < num_elem) { in writeDofsOffset1d() 75 const CeedInt ind = indices[node + elem * P_1D]; in writeDofsOffset1d() 84 inline void writeDofsStrided1d(const CeedInt num_comp, const CeedInt P_1D, const CeedInt strides_no… in writeDofsStrided1d() argument 90 if (item_id_x < P_1D && elem < num_elem) { in writeDofsStrided1d() [all …]
|
| /libCEED/tests/ |
| H A D | t319-basis.c | 208 CeedInt face_dim = 2, P_1D = 2; in main() local 216 CeedBasisCreateTensorH1Lagrange(ceed, face_dim, 1, 2, P_1D, CEED_GAUSS, &basis_face); in main()
|