| /libCEED/include/ceed/jit-source/sycl/ |
| H A D | sycl-shared-basis-tensor.h | 165 CeedScalar r_W[BASIS_DIM > 2 ? BASIS_Q_1D : 1]; in Weight() local 170 Weight1d(BASIS_Q_1D, q_weight_1d, r_W); in Weight() 171 …eElementStrided1d(1, BASIS_Q_1D, num_elem, 1, BASIS_NUM_QPTS * num_elem, BASIS_NUM_QPTS, r_W, d_W); in Weight() 174 WeightTensor2d(BASIS_Q_1D, q_weight_1d, r_W); in Weight() 175 …eElementStrided2d(1, BASIS_Q_1D, num_elem, 1, BASIS_NUM_QPTS * num_elem, BASIS_NUM_QPTS, r_W, d_W); in Weight() 178 WeightTensor3d(BASIS_Q_1D, q_weight_1d, r_W); in Weight() 179 …eElementStrided3d(1, BASIS_Q_1D, num_elem, 1, BASIS_NUM_QPTS * num_elem, BASIS_NUM_QPTS, r_W, d_W); in Weight()
|
| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-shared-basis-nontensor.h | 194 CeedScalar r_W[1]; in Weight() local 197 WeightNonTensor<BASIS_P, BASIS_Q>(data, q_weight, r_W); in Weight() 198 WriteElementStrided1d<1, BASIS_Q>(data, elem, 1, BASIS_Q * num_elem, BASIS_Q, r_W, d_W); in Weight()
|
| H A D | cuda-shared-basis-tensor.h | 489 CeedScalar r_W[BASIS_DIM > 2 ? BASIS_Q_1D : 1]; in Weight() local 494 Weight1d<BASIS_P_1D, BASIS_Q_1D>(data, q_weight_1d, r_W); in Weight() 495 … WriteElementStrided1d<1, BASIS_Q_1D>(data, elem, 1, BASIS_Q_1D * num_elem, BASIS_Q_1D, r_W, d_W); in Weight() 497 WeightTensor2d<BASIS_P_1D, BASIS_Q_1D>(data, q_weight_1d, r_W); in Weight() 498 … BASIS_Q_1D>(data, elem, 1, BASIS_Q_1D * BASIS_Q_1D * num_elem, BASIS_Q_1D * BASIS_Q_1D, r_W, d_W); in Weight() 500 WeightTensor3d<BASIS_P_1D, BASIS_Q_1D>(data, q_weight_1d, r_W); in Weight() 501 …lem, 1, BASIS_Q_1D * BASIS_Q_1D * BASIS_Q_1D * num_elem, BASIS_Q_1D * BASIS_Q_1D * BASIS_Q_1D, r_W, in Weight()
|
| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-shared-basis-nontensor.h | 197 CeedScalar r_W[1]; in __launch_bounds__() local 200 WeightNonTensor<BASIS_P, BASIS_Q>(data, q_weight, r_W); in __launch_bounds__() 201 WriteElementStrided1d<1, BASIS_Q>(data, elem, 1, BASIS_Q * num_elem, BASIS_Q, r_W, d_W); in __launch_bounds__()
|
| H A D | hip-shared-basis-tensor.h | 497 CeedScalar r_W[BASIS_DIM > 2 ? BASIS_Q_1D : 1]; in __launch_bounds__() local 501 Weight1d<BASIS_P_1D, BASIS_Q_1D>(data, q_weight_1d, r_W); in __launch_bounds__() 502 … WriteElementStrided1d<1, BASIS_Q_1D>(data, elem, 1, BASIS_Q_1D * num_elem, BASIS_Q_1D, r_W, d_W); in __launch_bounds__() 504 WeightTensor2d<BASIS_P_1D, BASIS_Q_1D>(data, q_weight_1d, r_W); in __launch_bounds__() 505 … BASIS_Q_1D>(data, elem, 1, BASIS_Q_1D * BASIS_Q_1D * num_elem, BASIS_Q_1D * BASIS_Q_1D, r_W, d_W); in __launch_bounds__() 507 WeightTensor3d<BASIS_P_1D, BASIS_Q_1D>(data, q_weight_1d, r_W); in __launch_bounds__() 508 …lem, 1, BASIS_Q_1D * BASIS_Q_1D * BASIS_Q_1D * num_elem, BASIS_Q_1D * BASIS_Q_1D * BASIS_Q_1D, r_W, in __launch_bounds__()
|