Lines Matching refs:opt_elems
73 const CeedInt opt_elems[7] = {0, 32, 8, 6, 4, 2, 8}; in CeedBasisApplyTensorCore_Cuda_shared() local
75 … CeedInt elems_per_block = CeedIntMax(thread_1d < 7 ? opt_elems[thread_1d] / num_comp : 1, 1); in CeedBasisApplyTensorCore_Cuda_shared()
127 const CeedInt opt_elems[7] = {0, 32, 8, 6, 4, 2, 8}; in CeedBasisApplyTensorCore_Cuda_shared() local
129 … CeedInt elems_per_block = CeedIntMax(thread_1d < 7 ? opt_elems[thread_1d] / num_comp : 1, 1); in CeedBasisApplyTensorCore_Cuda_shared()
165 const CeedInt opt_elems = block_size / (Q_1d * Q_1d); in CeedBasisApplyTensorCore_Cuda_shared() local
166 const CeedInt elems_per_block = opt_elems > 0 ? opt_elems : 1; in CeedBasisApplyTensorCore_Cuda_shared()
171 const CeedInt opt_elems = block_size / (Q_1d * Q_1d); in CeedBasisApplyTensorCore_Cuda_shared() local
172 const CeedInt elems_per_block = opt_elems > 0 ? opt_elems : 1; in CeedBasisApplyTensorCore_Cuda_shared()
338 const CeedInt opt_elems[7] = {0, 32, 8, 6, 4, 2, 8}; in CeedBasisApplyAtPointsCore_Cuda_shared() local
340 … CeedInt elems_per_block = CeedIntMax(thread_1d < 7 ? opt_elems[thread_1d] / num_comp : 1, 1); in CeedBasisApplyAtPointsCore_Cuda_shared()
387 const CeedInt opt_elems[7] = {0, 32, 8, 6, 4, 2, 8}; in CeedBasisApplyAtPointsCore_Cuda_shared() local
389 … CeedInt elems_per_block = CeedIntMax(thread_1d < 7 ? opt_elems[thread_1d] / num_comp : 1, 1); in CeedBasisApplyAtPointsCore_Cuda_shared()