xref: /libCEED/rust/libceed-sys/c-src/backends/hip-shared/ceed-hip-shared.h (revision 81ae61599cc0e14ccce523d66e38bf75c6f7903c)
15aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
37d8d0e25Snbeams //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
57d8d0e25Snbeams //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7509d4af6SJeremy L Thompson #pragma once
83d576824SJeremy L Thompson 
949aac155SJeremy L Thompson #include <ceed.h>
10ec3da8bcSJed Brown #include <ceed/backend.h>
113d576824SJeremy L Thompson #include <hip/hip_runtime.h>
122b730f8bSJeremy L Thompson 
137d8d0e25Snbeams typedef struct {
147d8d0e25Snbeams   hipModule_t   module;
15437930d1SJeremy L Thompson   hipFunction_t Interp;
169e201c85SYohann   hipFunction_t InterpTranspose;
17db2becc9SJeremy L Thompson   hipFunction_t InterpTransposeAdd;
18437930d1SJeremy L Thompson   hipFunction_t Grad;
199e201c85SYohann   hipFunction_t GradTranspose;
20db2becc9SJeremy L Thompson   hipFunction_t GradTransposeAdd;
21437930d1SJeremy L Thompson   hipFunction_t Weight;
221dda9c1aSJeremy L Thompson   hipModule_t   moduleAtPoints;
231dda9c1aSJeremy L Thompson   CeedInt       num_points;
241dda9c1aSJeremy L Thompson   hipFunction_t InterpAtPoints;
25*81ae6159SJeremy L Thompson   hipFunction_t InterpTransposeAtPoints;
261dda9c1aSJeremy L Thompson   hipFunction_t GradAtPoints;
27*81ae6159SJeremy L Thompson   hipFunction_t GradTransposeAtPoints;
28437930d1SJeremy L Thompson   CeedInt       block_sizes[3];  // interp, grad, weight thread block sizes
29437930d1SJeremy L Thompson   CeedScalar   *d_interp_1d;
30437930d1SJeremy L Thompson   CeedScalar   *d_grad_1d;
31437930d1SJeremy L Thompson   CeedScalar   *d_collo_grad_1d;
32437930d1SJeremy L Thompson   CeedScalar   *d_q_weight_1d;
331dda9c1aSJeremy L Thompson   CeedScalar   *d_chebyshev_interp_1d;
34111870feSJeremy L Thompson   CeedInt       num_elem_at_points;
35111870feSJeremy L Thompson   CeedInt      *h_points_per_elem;
36111870feSJeremy L Thompson   CeedInt      *d_points_per_elem;
377d8d0e25Snbeams } CeedBasis_Hip_shared;
387d8d0e25Snbeams 
396574a04fSJeremy L Thompson CEED_INTERN int CeedBasisCreateTensorH1_Hip_shared(CeedInt dim, CeedInt P_1d, CeedInt Q_1d, const CeedScalar *interp_1d, const CeedScalar *grad_1d,
406574a04fSJeremy L Thompson                                                    const CeedScalar *q_ref_1d, const CeedScalar *q_weight_1d, CeedBasis basis);
41