Home
last modified time | relevance | path

Searched refs:device_prop (Results 1 – 9 of 9) sorted by relevance

/libCEED/backends/cuda-gen/
H A Dceed-cuda-gen-operator.c212 …CeedCallBackend(BlockGridCalculate(num_elem, min_grid_size / cuda_data->device_prop.multiProcessor… in CeedOperatorApplyAddCore_Cuda_gen()
213 … cuda_data->device_prop.maxThreadsDim[2], cuda_data->device_prop.warpSize, block, &grid)); in CeedOperatorApplyAddCore_Cuda_gen()
215 …CeedInt elems_per_block = CeedIntMin(cuda_data->device_prop.maxThreadsDim[2], CeedIntMax(512 / dat… in CeedOperatorApplyAddCore_Cuda_gen()
467 …CeedCallBackend(BlockGridCalculate(num_elem, min_grid_size / cuda_data->device_prop.multiProcessor… in CeedOperatorLinearAssembleQFunctionCore_Cuda_gen()
468 … cuda_data->device_prop.maxThreadsDim[2], cuda_data->device_prop.warpSize, block, &grid)); in CeedOperatorLinearAssembleQFunctionCore_Cuda_gen()
470 …CeedInt elems_per_block = CeedIntMin(cuda_data->device_prop.maxThreadsDim[2], CeedIntMax(512 / dat… in CeedOperatorLinearAssembleQFunctionCore_Cuda_gen()
641 …CeedCallBackend(BlockGridCalculate(num_elem, min_grid_size / cuda_data->device_prop.multiProcessor… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Cuda_gen()
642 … cuda_data->device_prop.maxThreadsDim[2], cuda_data->device_prop.warpSize, block, &grid)); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Cuda_gen()
806 …CeedCallBackend(BlockGridCalculate(num_elem, min_grid_size / cuda_data->device_prop.multiProcessor… in CeedOperatorAssembleSingleAtPoints_Cuda_gen()
807 … cuda_data->device_prop.maxThreadsDim[2], cuda_data->device_prop.warpSize, block, &grid)); in CeedOperatorAssembleSingleAtPoints_Cuda_gen()
/libCEED/backends/hip/
H A Dceed-hip-common.c33 CeedCallHip(ceed, hipGetDeviceProperties(&data->device_prop, current_device_id)); in CeedInit_Hip()
36 data->has_unified_addressing = xnack_value > 0 ? data->device_prop.unifiedAddressing : 0; in CeedInit_Hip()
H A Dceed-hip-common.h73 struct hipDeviceProp_t device_prop; member
/libCEED/backends/cuda-shared/
H A Dceed-cuda-shared-basis.c62 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyTensorCore_Cuda_shared()
116 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyTensorCore_Cuda_shared()
326 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyAtPointsCore_Cuda_shared()
376 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyAtPointsCore_Cuda_shared()
485 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyNonTensorCore_Cuda_shared()
509 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyNonTensorCore_Cuda_shared()
533 …CeedInt elems_per_block = CeedIntMin(ceed_Cuda->device_prop.maxThreadsDim[2], CeedIntMax(512 / thr… in CeedBasisApplyNonTensorCore_Cuda_shared()
677 cuda_data->device_prop.sharedMemPerBlock) { in CeedBasisCreateH1_Cuda_shared()
/libCEED/backends/cuda/
H A Dceed-cuda-common.h72 struct cudaDeviceProp device_prop; member
H A Dceed-cuda-common.c33 CeedCallCuda(ceed, cudaGetDeviceProperties(&data->device_prop, current_device_id)); in CeedInit_Cuda()
/libCEED/backends/hip-shared/
H A Dceed-hip-shared-basis.c743 hip_data->device_prop.sharedMemPerBlock) { in CeedBasisCreateH1_Hip_shared()
/libCEED/backends/hip-ref/
H A Dceed-hip-ref-operator.c1608 …>block_size_x * asmb->block_size_y * asmb->elems_per_block > hip_data->device_prop.maxThreadsPerBl… in CeedOperatorAssembleSingleSetup_Hip()
/libCEED/backends/cuda-ref/
H A Dceed-cuda-ref-operator.c1611 …block_size_x * asmb->block_size_y * asmb->elems_per_block > cuda_data->device_prop.maxThreadsPerBl… in CeedOperatorAssembleSingleSetup_Cuda()