Lines Matching refs:T
19 template <typename T, bool Add>
22 template <typename T>
23 struct magma_grad_3d_device_accumulate<T, true> {
24 static __device__ __inline__ void op(T &rV, const T &rTmp) { rV += rTmp; }
27 template <typename T>
28 struct magma_grad_3d_device_accumulate<T, false> {
29 static __device__ __inline__ void op(T &rV, const T &rTmp) { rV = rTmp; }
40 template <typename T, int DIM_U, int DIM_V, int NUM_COMP, int P, int Q, int rU_SIZE, int rV_SIZE, i…
41 static __device__ __inline__ void magma_grad_3d_device(const T *sTinterp, const T *sTgrad, T rU[DIM…
42 … T rV[DIM_V][NUM_COMP][rV_SIZE], const int tx, T rTmp, T *swork) {
55 T *sW1 = swork;
56 T *sW2 = sW1 + P * P * Q;
62 const T *sT = (i_DIM == 0) ? sTgrad : sTinterp;
63 T *sTmp = sW1 + batchid * (1 * Q);
79 const T *sT = (i_DIM == 1) ? sTgrad : sTinterp;
80 T *sTmp = sW1 + batchid * (Q * P); // sTmp is input
81 T *sTmp2 = sW2 + batchid * (Q * Q); // sTmp2 is output
97 const T *sT = (i_DIM == 2) ? sTgrad : sTinterp;
98 T *sTmp = sW2; // sTmp is input
104 magma_grad_3d_device_accumulate<T, ADD>::op(rV[i_DIM_V][comp][j], rTmp);