Searched refs:q_bytes (Results 1 – 4 of 4) sorted by relevance
| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-basis.c | 402 const CeedInt q_bytes = Q_1d * sizeof(CeedScalar); in CeedBasisCreateTensorH1_Hip() local 403 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Hip() 411 CeedCallHip(ceed, hipMalloc((void **)&data->d_q_weight_1d, q_bytes)); in CeedBasisCreateTensorH1_Hip() 412 CeedCallHip(ceed, hipMemcpy(data->d_q_weight_1d, q_weight_1d, q_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip() 449 const CeedInt q_bytes = num_qpts * sizeof(CeedScalar); in CeedBasisCreateH1_Hip() local 459 CeedCallHip(ceed, hipMalloc((void **)&data->d_q_weight, q_bytes)); in CeedBasisCreateH1_Hip() 460 CeedCallHip(ceed, hipMemcpy(data->d_q_weight, q_weight, q_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateH1_Hip() 463 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Hip() 469 const CeedInt grad_bytes = q_bytes * num_nodes * q_comp_grad; in CeedBasisCreateH1_Hip() 504 const CeedInt q_bytes = num_qpts * sizeof(CeedScalar); in CeedBasisCreateHdiv_Hip() local [all …]
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-basis.c | 403 const CeedInt q_bytes = Q_1d * sizeof(CeedScalar); in CeedBasisCreateTensorH1_Cuda() local 404 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Cuda() 412 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_q_weight_1d, q_bytes)); in CeedBasisCreateTensorH1_Cuda() 413 … CeedCallCuda(ceed, cudaMemcpy(data->d_q_weight_1d, q_weight_1d, q_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda() 450 const CeedInt q_bytes = num_qpts * sizeof(CeedScalar); in CeedBasisCreateH1_Cuda() local 460 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_q_weight, q_bytes)); in CeedBasisCreateH1_Cuda() 461 CeedCallCuda(ceed, cudaMemcpy(data->d_q_weight, q_weight, q_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateH1_Cuda() 464 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Cuda() 470 const CeedInt grad_bytes = q_bytes * num_nodes * q_comp_grad; in CeedBasisCreateH1_Cuda() 505 const CeedInt q_bytes = num_qpts * sizeof(CeedScalar); in CeedBasisCreateHdiv_Cuda() local [all …]
|
| /libCEED/backends/hip-shared/ |
| H A D | ceed-hip-shared-basis.c | 659 const CeedInt q_bytes = Q_1d * sizeof(CeedScalar); in CeedBasisCreateTensorH1_Hip_shared() local 660 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Hip_shared() 668 CeedCallHip(ceed, hipMalloc((void **)&data->d_q_weight_1d, q_bytes)); in CeedBasisCreateTensorH1_Hip_shared() 669 CeedCallHip(ceed, hipMemcpy(data->d_q_weight_1d, q_weight_1d, q_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Hip_shared() 685 CeedCallHip(ceed, hipMalloc((void **)&data->d_collo_grad_1d, q_bytes * Q_1d)); in CeedBasisCreateTensorH1_Hip_shared() 686 …CeedCallHip(ceed, hipMemcpy(data->d_collo_grad_1d, collo_grad_1d, q_bytes * Q_1d, hipMemcpyHostToD… in CeedBasisCreateTensorH1_Hip_shared() 732 const CeedInt q_bytes = num_qpts * sizeof(CeedScalar); in CeedBasisCreateH1_Hip_shared() local 756 CeedCallHip(ceed, hipMalloc((void **)&data->d_q_weight_1d, q_bytes)); in CeedBasisCreateH1_Hip_shared() 757 CeedCallHip(ceed, hipMemcpy(data->d_q_weight_1d, q_weight, q_bytes, hipMemcpyHostToDevice)); in CeedBasisCreateH1_Hip_shared() 760 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Hip_shared() [all …]
|
| /libCEED/backends/cuda-shared/ |
| H A D | ceed-cuda-shared-basis.c | 598 const CeedInt q_bytes = Q_1d * sizeof(CeedScalar); in CeedBasisCreateTensorH1_Cuda_shared() local 599 const CeedInt interp_bytes = q_bytes * P_1d; in CeedBasisCreateTensorH1_Cuda_shared() 607 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_q_weight_1d, q_bytes)); in CeedBasisCreateTensorH1_Cuda_shared() 608 … CeedCallCuda(ceed, cudaMemcpy(data->d_q_weight_1d, q_weight_1d, q_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateTensorH1_Cuda_shared() 624 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_collo_grad_1d, q_bytes * Q_1d)); in CeedBasisCreateTensorH1_Cuda_shared() 625 …CeedCallCuda(ceed, cudaMemcpy(data->d_collo_grad_1d, collo_grad_1d, q_bytes * Q_1d, cudaMemcpyHost… in CeedBasisCreateTensorH1_Cuda_shared() 666 const CeedInt q_bytes = num_qpts * sizeof(CeedScalar); in CeedBasisCreateH1_Cuda_shared() local 690 CeedCallCuda(ceed, cudaMalloc((void **)&data->d_q_weight_1d, q_bytes)); in CeedBasisCreateH1_Cuda_shared() 691 CeedCallCuda(ceed, cudaMemcpy(data->d_q_weight_1d, q_weight, q_bytes, cudaMemcpyHostToDevice)); in CeedBasisCreateH1_Cuda_shared() 694 const CeedInt interp_bytes = q_bytes * num_nodes * q_comp_interp; in CeedBasisCreateH1_Cuda_shared() [all …]
|