| /libCEED/include/ceed/jit-source/magma/ |
| H A D | magma-common-tensor.h | 19 …_inline__ void read_1d(const T *devptr, const int compstride, T *sBuffer[NUM_COMP], const int tx) { in read_1d() 31 …e__ __inline__ void write_1d(T *sBuffer[NUM_COMP], T *devptr, const int compstride, const int tx) { in write_1d() 43 …ice__ __inline__ void sum_1d(T *sBuffer[NUM_COMP], T *devptr, const int compstride, const int tx) { in sum_1d() 59 …ad_U_2d(const T *dU, const int compstride, T rU[DIM_U][NUM_COMP][rU_SIZE], T *sTmp, const int tx) { in read_U_2d() 95 …_ void read_V_2d(const T *dV, const int compstride, T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx) { in read_V_2d() 112 …line__ void write_V_2d(T *dV, const int compstride, T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx) { in write_V_2d() 129 …inline__ void sum_V_2d(T *dV, const int compstride, T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx) { in sum_V_2d() 147 …ad_U_3d(const T *dU, const int compstride, T rU[DIM_U][NUM_COMP][rU_SIZE], T *sTmp, const int tx) { in read_U_3d() 183 …_ void read_V_3d(const T *dV, const int compstride, T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx) { in read_V_3d() 200 …line__ void write_V_3d(T *dV, const int compstride, T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx) { in write_V_3d() [all …]
|
| H A D | magma-common-nontensor.h | 20 static __device__ __inline__ void read_A_notrans_g2r_1D_nosync(const int tx, const int ty, const T … in read_A_notrans_g2r_1D_nosync() 45 static __device__ __inline__ void read_A_trans_g2r_1D_nosync(const int tx, const int ty, const T *d… in read_A_trans_g2r_1D_nosync() 70 static __device__ __inline__ void read_B_g2s_1D_nosync(const int tx, const int n, const T *dB, T *s… in read_B_g2s_1D_nosync() 94 static __device__ __inline__ void write_C_r2g_1D_nosync(const int tx, const int n, T rC[NB], T *dC)… in write_C_r2g_1D_nosync() 113 static __device__ __inline__ void sum_C_r2g_1D_nosync(const int tx, const int n, T rC[NB], T *dC) { in sum_C_r2g_1D_nosync()
|
| H A D | magma-basis-interp-deriv-nontensor.h | 16 const int tx = threadIdx.x; in magma_basis_nontensor_device_n() local 59 const int tx = threadIdx.x; in magma_basis_nontensor_device_t() local 105 const int tx = threadIdx.x; in magma_basis_nontensor_device_ta() local 151 const int tx = threadIdx.x; in magma_basis_nontensor_device_n1() local 187 const int tx = threadIdx.x; in magma_basis_nontensor_device_t1() local 223 const int tx = threadIdx.x; in magma_basis_nontensor_device_ta1() local
|
| H A D | magma-basis-weight-nontensor.h | 17 const int tx = threadIdx.x; in __launch_bounds__() local
|
| H A D | magma-basis-weight-1d.h | 15 static __device__ __inline__ void magma_weight_1d_device(const T *sTweight, T *sV, const int tx) { in magma_weight_1d_device()
|
| H A D | magma-basis-weight-3d.h | 15 …_ __inline__ void magma_weight_3d_device(const T *sTweight, T rV[DIM][NUM_COMP][Q], const int tx) { in magma_weight_3d_device()
|
| H A D | magma-basis-weight-2d.h | 15 …_ __inline__ void magma_weight_2d_device(const T *sTweight, T rV[DIM][NUM_COMP][Q], const int tx) { in magma_weight_2d_device()
|
| H A D | magma-basis-grad-1d.h | 18 …__inline__ void magma_grad_1d_device(const T *sT, T *sU[NUM_COMP], T *sV[NUM_COMP], const int tx) { in magma_grad_1d_device()
|
| H A D | magma-basis-interp-1d.h | 18 …inline__ void magma_interp_1d_device(const T *sT, T *sU[NUM_COMP], T *sV[NUM_COMP], const int tx) { in magma_interp_1d_device()
|
| H A D | magma-basis-interp-2d.h | 19 …d_device(const T *sT, T rU[DIM_U][NUM_COMP][rU_SIZE], T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx, in magma_interp_2d_device()
|
| H A D | magma-basis-interp-3d.h | 19 …d_device(const T *sT, T rU[DIM_U][NUM_COMP][rU_SIZE], T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx, in magma_interp_3d_device()
|