| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-basis.c | 166 CeedSize interp_bytes; in CeedBasisApplyAtPointsCore_Hip() local 169 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Hip() 172 CeedCallHip(ceed, hipMalloc((void **)&data->d_chebyshev_interp_1d, interp_bytes)); in CeedBasisApplyAtPointsCore_Hip() 173 …CeedCallHip(ceed, hipMemcpy(data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, hipMem… in CeedBasisApplyAtPointsCore_Hip() 403 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Hip() local 414 CeedCallHip(ceed, hipMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Hip() 415 CeedCallHip(ceed, hipMemcpy(data->d_interp_1d, interp_1d, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip() 416 CeedCallHip(ceed, hipMalloc((void **)&data->d_grad_1d, interp_bytes)); in CeedBasisCreateTensorH1_Hip() 417 CeedCallHip(ceed, hipMemcpy(data->d_grad_1d, grad_1d, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip() 463 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Hip() local [all …]
|
| H A D | ceed-hip-ref-operator.c | 1206 const CeedInt interp_bytes = num_nodes * num_qpts * sizeof(CeedScalar); in CeedOperatorAssembleDiagonalSetup_Hip() local 1218 CeedCallHip(ceed, hipMalloc((void **)&diag->d_identity, interp_bytes)); in CeedOperatorAssembleDiagonalSetup_Hip() 1219 CeedCallHip(ceed, hipMemcpy(diag->d_identity, identity, interp_bytes, hipMemcpyHostToDevice)); in CeedOperatorAssembleDiagonalSetup_Hip() 1239 CeedCallHip(ceed, hipMalloc((void **)&d_interp, interp_bytes * q_comp_interp)); in CeedOperatorAssembleDiagonalSetup_Hip() 1240 …CeedCallHip(ceed, hipMemcpy(d_interp, interp, interp_bytes * q_comp_interp, hipMemcpyHostToDevice)… in CeedOperatorAssembleDiagonalSetup_Hip() 1242 CeedCallHip(ceed, hipMalloc((void **)&d_grad, interp_bytes * q_comp_grad)); in CeedOperatorAssembleDiagonalSetup_Hip() 1243 … CeedCallHip(ceed, hipMemcpy(d_grad, grad, interp_bytes * q_comp_grad, hipMemcpyHostToDevice)); in CeedOperatorAssembleDiagonalSetup_Hip() 1261 CeedCallHip(ceed, hipMalloc((void **)&d_interp, interp_bytes * q_comp_interp)); in CeedOperatorAssembleDiagonalSetup_Hip() 1262 …CeedCallHip(ceed, hipMemcpy(d_interp, interp, interp_bytes * q_comp_interp, hipMemcpyHostToDevice)… in CeedOperatorAssembleDiagonalSetup_Hip() 1264 CeedCallHip(ceed, hipMalloc((void **)&d_div, interp_bytes * q_comp_div)); in CeedOperatorAssembleDiagonalSetup_Hip() [all …]
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-basis.c | 167 CeedSize interp_bytes; in CeedBasisApplyAtPointsCore_Cuda() local 170 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Cuda() 173 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_chebyshev_interp_1d, interp_bytes)); in CeedBasisApplyAtPointsCore_Cuda() 174 …CeedCallCuda(ceed, cudaMemcpy(data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, cuda… in CeedBasisApplyAtPointsCore_Cuda() 404 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Cuda() local 415 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Cuda() 416 …CeedCallCuda(ceed, cudaMemcpy(data->d_interp_1d, interp_1d, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda() 417 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_grad_1d, interp_bytes)); in CeedBasisCreateTensorH1_Cuda() 418 CeedCallCuda(ceed, cudaMemcpy(data->d_grad_1d, grad_1d, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda() 464 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Cuda() local [all …]
|
| H A D | ceed-cuda-ref-operator.c | 1209 const CeedInt interp_bytes = num_nodes * num_qpts * sizeof(CeedScalar); in CeedOperatorAssembleDiagonalSetup_Cuda() local 1221 CeedCallCuda(ceed, cudaMalloc((void **)&diag->d_identity, interp_bytes)); in CeedOperatorAssembleDiagonalSetup_Cuda() 1222 … CeedCallCuda(ceed, cudaMemcpy(diag->d_identity, identity, interp_bytes, cudaMemcpyHostToDevice)); in CeedOperatorAssembleDiagonalSetup_Cuda() 1242 CeedCallCuda(ceed, cudaMalloc((void **)&d_interp, interp_bytes * q_comp_interp)); in CeedOperatorAssembleDiagonalSetup_Cuda() 1243 …CeedCallCuda(ceed, cudaMemcpy(d_interp, interp, interp_bytes * q_comp_interp, cudaMemcpyHostToDevi… in CeedOperatorAssembleDiagonalSetup_Cuda() 1245 CeedCallCuda(ceed, cudaMalloc((void **)&d_grad, interp_bytes * q_comp_grad)); in CeedOperatorAssembleDiagonalSetup_Cuda() 1246 … CeedCallCuda(ceed, cudaMemcpy(d_grad, grad, interp_bytes * q_comp_grad, cudaMemcpyHostToDevice)); in CeedOperatorAssembleDiagonalSetup_Cuda() 1264 CeedCallCuda(ceed, cudaMalloc((void **)&d_interp, interp_bytes * q_comp_interp)); in CeedOperatorAssembleDiagonalSetup_Cuda() 1265 …CeedCallCuda(ceed, cudaMemcpy(d_interp, interp, interp_bytes * q_comp_interp, cudaMemcpyHostToDevi… in CeedOperatorAssembleDiagonalSetup_Cuda() 1267 CeedCallCuda(ceed, cudaMalloc((void **)&d_div, interp_bytes * q_comp_div)); in CeedOperatorAssembleDiagonalSetup_Cuda() [all …]
|
| /libCEED/backends/hip-shared/ |
| H A D | ceed-hip-shared-basis.c | 340 CeedSize interp_bytes; in CeedBasisApplyAtPointsCore_Hip_shared() local 343 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Hip_shared() 346 CeedCallHip(ceed, hipMalloc((void **)&data->d_chebyshev_interp_1d, interp_bytes)); in CeedBasisApplyAtPointsCore_Hip_shared() 347 …CeedCallHip(ceed, hipMemcpy(data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, hipMem… in CeedBasisApplyAtPointsCore_Hip_shared() 660 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Hip_shared() local 671 CeedCallHip(ceed, hipMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Hip_shared() 672 CeedCallHip(ceed, hipMemcpy(data->d_interp_1d, interp_1d, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip_shared() 673 CeedCallHip(ceed, hipMalloc((void **)&data->d_grad_1d, interp_bytes)); in CeedBasisCreateTensorH1_Hip_shared() 674 CeedCallHip(ceed, hipMemcpy(data->d_grad_1d, grad_1d, interp_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip_shared() 760 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Hip_shared() local [all …]
|
| /libCEED/backends/cuda-shared/ |
| H A D | ceed-cuda-shared-basis.c | 275 CeedSize interp_bytes; in CeedBasisApplyAtPointsCore_Cuda_shared() local 278 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedBasisApplyAtPointsCore_Cuda_shared() 281 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_chebyshev_interp_1d, interp_bytes)); in CeedBasisApplyAtPointsCore_Cuda_shared() 282 …CeedCallCuda(ceed, cudaMemcpy(data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, cuda… in CeedBasisApplyAtPointsCore_Cuda_shared() 599 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Cuda_shared() local 610 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_interp_1d, interp_bytes)); in CeedBasisCreateTensorH1_Cuda_shared() 611 …CeedCallCuda(ceed, cudaMemcpy(data->d_interp_1d, interp_1d, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda_shared() 612 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_grad_1d, interp_bytes)); in CeedBasisCreateTensorH1_Cuda_shared() 613 CeedCallCuda(ceed, cudaMemcpy(data->d_grad_1d, grad_1d, interp_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda_shared() 694 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Cuda_shared() local [all …]
|
| /libCEED/backends/hip-gen/ |
| H A D | ceed-hip-gen-operator-build.cpp | 276 CeedSize interp_bytes; in CeedOperatorBuildKernelFieldData_Hip_gen() local 279 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedOperatorBuildKernelFieldData_Hip_gen() 282 …(CeedBasisReturnCeed(basis), hipMalloc((void **)&basis_data->d_chebyshev_interp_1d, interp_bytes)); in CeedOperatorBuildKernelFieldData_Hip_gen() 284 …hipMemcpy(basis_data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, hipMemcpyHostToDev… in CeedOperatorBuildKernelFieldData_Hip_gen() 314 CeedSize interp_bytes; in CeedOperatorBuildKernelFieldData_Hip_gen() local 317 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedOperatorBuildKernelFieldData_Hip_gen() 320 …(CeedBasisReturnCeed(basis), hipMalloc((void **)&basis_data->d_chebyshev_interp_1d, interp_bytes)); in CeedOperatorBuildKernelFieldData_Hip_gen() 322 …hipMemcpy(basis_data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, hipMemcpyHostToDev… in CeedOperatorBuildKernelFieldData_Hip_gen()
|
| /libCEED/backends/cuda-gen/ |
| H A D | ceed-cuda-gen-operator-build.cpp | 249 CeedSize interp_bytes; in CeedOperatorBuildKernelFieldData_Cuda_gen() local 252 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedOperatorBuildKernelFieldData_Cuda_gen() 255 …CeedBasisReturnCeed(basis), cudaMalloc((void **)&basis_data->d_chebyshev_interp_1d, interp_bytes)); in CeedOperatorBuildKernelFieldData_Cuda_gen() 257 …cudaMemcpy(basis_data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, cudaMemcpyHostToD… in CeedOperatorBuildKernelFieldData_Cuda_gen() 287 CeedSize interp_bytes; in CeedOperatorBuildKernelFieldData_Cuda_gen() local 290 interp_bytes = P_1d * Q_1d * sizeof(CeedScalar); in CeedOperatorBuildKernelFieldData_Cuda_gen() 293 …CeedBasisReturnCeed(basis), cudaMalloc((void **)&basis_data->d_chebyshev_interp_1d, interp_bytes)); in CeedOperatorBuildKernelFieldData_Cuda_gen() 295 …cudaMemcpy(basis_data->d_chebyshev_interp_1d, chebyshev_interp_1d, interp_bytes, cudaMemcpyHostToD… in CeedOperatorBuildKernelFieldData_Cuda_gen()
|