| /libCEED/backends/magma/ |
| H A D | ceed-magma-gemm-nontensor.cpp | 26 magma_int_t lddc, magma_queue_t queue) { in magmablas_gemm() argument 29 queue); in magmablas_gemm() 32 queue); in magmablas_gemm() 41 … magma_int_t lddc, magma_int_t strideC, magma_int_t batchCount, magma_queue_t queue) { in magmablas_gemm_batched_strided() argument 44 (float)beta, (float *)d_C, lddc, strideC, batchCount, queue); in magmablas_gemm_batched_strided() 47 (double)beta, (double *)d_C, lddc, strideC, batchCount, queue); in magmablas_gemm_batched_strided() 55 magma_int_t lddc, magma_queue_t queue) { in devblas_gemm() argument 57 …alpha, (const float *)d_A, ldda, (const float *)d_B, lddb, (float)beta, (float *)d_C, lddc, queue); in devblas_gemm() 60 queue); in devblas_gemm() 69 … magma_int_t strideC, magma_int_t batchCount, magma_queue_t queue) { in devblas_gemm_batched_strided() argument [all …]
|
| H A D | ceed-magma-common.c | 35 magma_queue_create_from_hip(data->device_id, NULL, NULL, NULL, &(data->queue)); in CeedInit_Magma_common() 37 magma_queue_create_from_cuda(data->device_id, NULL, NULL, NULL, &(data->queue)); in CeedInit_Magma_common() 49 magma_queue_destroy(data->queue); in CeedDestroy_Magma()
|
| H A D | ceed-magma-basis.c | 245 ceed_magma_queue_sync(data->queue); in CeedBasisApplyCore_Magma() 437 …ns, MagmaNoTrans, P, N, Q, 1.0, d_b + d * P * Q, P, d_u + d * N * Q, Q, beta, d_v, P, data->queue); in CeedBasisApplyNonTensorCore_Magma() 439 …ans, MagmaNoTrans, Q, N, P, 1.0, d_b + d * P * Q, P, d_u, P, 0.0, d_v + d * N * Q, Q, data->queue); in CeedBasisApplyNonTensorCore_Magma() 455 ceed_magma_queue_sync(data->queue); in CeedBasisApplyNonTensorCore_Magma() 549 …magma_setvector(Q_1d, sizeof(q_weight_1d[0]), q_weight_1d, 1, impl->d_q_weight_1d, 1, data->queue); in CeedBasisCreateTensorH1_Magma() 552 …agma_setvector(Q_1d * P_1d, sizeof(interp_1d[0]), interp_1d, 1, impl->d_interp_1d, 1, data->queue); in CeedBasisCreateTensorH1_Magma() 554 magma_setvector(Q_1d * P_1d, sizeof(grad_1d[0]), grad_1d, 1, impl->d_grad_1d, 1, data->queue); in CeedBasisCreateTensorH1_Magma() 655 magma_setvector(num_qpts, sizeof(q_weight[0]), q_weight, 1, impl->d_q_weight, 1, data->queue); in CeedBasisCreateH1_Magma() 662 …um_qpts * num_nodes * q_comp_interp, sizeof(interp[0]), interp, 1, impl->d_interp, 1, data->queue); in CeedBasisCreateH1_Magma() 669 …vector(num_qpts * num_nodes * q_comp_grad, sizeof(grad[0]), grad, 1, impl->d_grad, 1, data->queue); in CeedBasisCreateH1_Magma() [all …]
|
| H A D | ceed-magma-common.h | 15 magma_queue_t queue; member
|
| H A D | ceed-magma-gemm-nontensor.h | 14 CeedScalar *d_C, magma_int_t lddc, magma_queue_t queue);
|
| /libCEED/backends/sycl/ |
| H A D | ceed-sycl-common.sycl.cpp | 68 …sycl::queue sycl_queue{sycl_context, sycl_device, sycl_async_handler, sycl::property::queue::in_… in CeedInit_Sycl() 99 sycl::queue *q = static_cast<sycl::queue *>(handle); in CeedSetStream_Sycl()
|
| H A D | ceed-sycl-common.hpp | 37 sycl::queue sycl_queue;
|
| /libCEED/backends/sycl-ref/ |
| H A D | ceed-sycl-restriction.sycl.cpp | 27 static int CeedElemRestrictionStridedNoTranspose_Sycl(sycl::queue &sycl_queue, const CeedElemRestri… in CeedElemRestrictionStridedNoTranspose_Sycl() 54 static int CeedElemRestrictionOffsetNoTranspose_Sycl(sycl::queue &sycl_queue, const CeedElemRestric… in CeedElemRestrictionOffsetNoTranspose_Sycl() 82 static int CeedElemRestrictionStridedTranspose_Sycl(sycl::queue &sycl_queue, const CeedElemRestrict… in CeedElemRestrictionStridedTranspose_Sycl() 110 static int CeedElemRestrictionOffsetTranspose_Sycl(sycl::queue &sycl_queue, const CeedElemRestricti… in CeedElemRestrictionOffsetTranspose_Sycl()
|
| H A D | ceed-sycl-vector.sycl.cpp | 284 static int CeedDeviceSetValue_Sycl(sycl::queue &sycl_queue, CeedScalar *d_array, CeedSize length, C… in CeedDeviceSetValue_Sycl() 506 static int CeedDeviceReciprocal_Sycl(sycl::queue &sycl_queue, CeedScalar *d_array, CeedSize length)… in CeedDeviceReciprocal_Sycl() 548 static int CeedDeviceScale_Sycl(sycl::queue &sycl_queue, CeedScalar *x_array, CeedScalar alpha, Cee… in CeedDeviceScale_Sycl() 588 static int CeedDeviceAXPY_Sycl(sycl::queue &sycl_queue, CeedScalar *y_array, CeedScalar alpha, Ceed… in CeedDeviceAXPY_Sycl() 635 static int CeedDevicePointwiseMult_Sycl(sycl::queue &sycl_queue, CeedScalar *w_array, CeedScalar *x… in CeedDevicePointwiseMult_Sycl()
|
| H A D | ceed-sycl-ref-basis.sycl.cpp | 39 static int CeedBasisApplyInterp_Sycl(sycl::queue &sycl_queue, const SyclModule_t &sycl_module, Ceed… in CeedBasisApplyInterp_Sycl() 142 static int CeedBasisApplyGrad_Sycl(sycl::queue &sycl_queue, const SyclModule_t &sycl_module, CeedIn… in CeedBasisApplyGrad_Sycl() 245 static int CeedBasisApplyWeight_Sycl(sycl::queue &sycl_queue, CeedInt num_elem, const CeedBasis_Syc… in CeedBasisApplyWeight_Sycl() 338 static int CeedBasisApplyNonTensorInterp_Sycl(sycl::queue &sycl_queue, CeedInt num_elem, CeedInt is… in CeedBasisApplyNonTensorInterp_Sycl() 379 static int CeedBasisApplyNonTensorGrad_Sycl(sycl::queue &sycl_queue, CeedInt num_elem, CeedInt is_t… in CeedBasisApplyNonTensorGrad_Sycl() 435 static int CeedBasisApplyNonTensorWeight_Sycl(sycl::queue &sycl_queue, CeedInt num_elem, const Ceed… in CeedBasisApplyNonTensorWeight_Sycl()
|
| H A D | ceed-sycl-ref-operator.sycl.cpp | 832 static int CeedOperatorLinearDiagonal_Sycl(sycl::queue &sycl_queue, const bool is_point_block, cons… in CeedOperatorLinearDiagonal_Sycl() 1189 static int CeedOperatorLinearAssemble_Sycl(sycl::queue &sycl_queue, const CeedOperator_Sycl *impl, … in CeedOperatorLinearAssemble_Sycl()
|