Home
last modified time | relevance | path

Searched defs:shared_mem (Results 1 – 6 of 6) sorted by relevance

/libCEED/backends/cuda-shared/
H A D ceed-cuda-shared-basis.c
64 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Cuda_shared() local
77 CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Cuda_shared() local
89 CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Cuda_shared() local
118 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Cuda_shared() local
131 CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Cuda_shared() local
142 CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Cuda_shared() local
328 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Cuda_shared() local
342 CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Cuda_shared() local
354 CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Cuda_shared() local
378 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Cuda_shared() local
[all …]
/libCEED/backends/hip-shared/
H A D ceed-hip-shared-basis.c
131 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Hip_shared() local
143 … CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Hip_shared() local
154 … CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Hip_shared() local
183 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Hip_shared() local
195 … CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Hip_shared() local
206 … CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyTensorCore_Hip_shared() local
394 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Hip_shared() local
406 … CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Hip_shared() local
418 … CeedInt shared_mem = elems_per_block * thread_1d * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Hip_shared() local
442 CeedInt shared_mem = elems_per_block * thread_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Hip_shared() local
[all …]
/libCEED/backends/magma/
H A D ceed-magma-basis.c
91 CeedInt shared_mem = 0; in CeedBasisApplyCore_Magma() local
168 CeedInt shared_mem = 0; in CeedBasisApplyCore_Magma() local
210 CeedInt shared_mem = 0; in CeedBasisApplyCore_Magma() local
429 …CeedInt shared_mem = (t_mode != CEED_TRANSPOSE && q_comp > 1) ? (shared_mem_A + shared_mem_B) : … in CeedBasisApplyNonTensorCore_Magma() local
448 CeedInt shared_mem = Q * sizeof(CeedScalar) + num_t_col * Q * sizeof(CeedScalar); in CeedBasisApplyNonTensorCore_Magma() local
/libCEED/backends/cuda-gen/
H A D ceed-cuda-gen-operator.c
220 CeedInt shared_mem = block[0] * block[1] * block[2] * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Cuda_gen() local
475 CeedInt shared_mem = block[0] * block[1] * block[2] * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Cuda_gen() local
643 CeedInt shared_mem = block[0] * block[1] * block[2] * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Cuda_gen() local
808 CeedInt shared_mem = block[0] * block[1] * block[2] * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Cuda_gen() local
/libCEED/backends/hip-ref/
H A D ceed-hip-ref-operator.c
1778 CeedInt shared_mem = … in CeedOperatorAssembleSingle_Hip() local
/libCEED/backends/cuda-ref/
H A D ceed-cuda-ref-operator.c
1781 CeedInt shared_mem = … in CeedOperatorAssembleSingle_Cuda() local