xref: /libCEED/rust/libceed-sys/c-src/backends/cuda-gen/ceed-cuda-gen.h (revision d4cc18453651bd0f94c1a2e078b2646a92dafdcc)
1*9ba83ac0SJeremy L Thompson // Copyright (c) 2017-2026, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3241a4b83SYohann //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5241a4b83SYohann //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7509d4af6SJeremy L Thompson #pragma once
83d576824SJeremy L Thompson 
949aac155SJeremy L Thompson #include <ceed.h>
10ec3da8bcSJed Brown #include <ceed/backend.h>
1149aac155SJeremy L Thompson #include <ceed/jit-source/cuda/cuda-types.h>
12241a4b83SYohann #include <cuda.h>
132b730f8bSJeremy L Thompson 
14241a4b83SYohann typedef struct {
150183ed61SJeremy L Thompson   bool           use_fallback, use_assembly_fallback;
16241a4b83SYohann   CeedInt        dim;
17c433aabcSJeremy L Thompson   CeedInt        Q, Q_1d;
189e201c85SYohann   CeedInt        max_P_1d;
19a61b1c91SJeremy L Thompson   CeedInt        thread_1d;
200816752eSJeremy L Thompson   CUmodule       module, module_assemble_full, module_assemble_diagonal, module_assemble_qfunction;
210816752eSJeremy L Thompson   CUfunction     op, assemble_full, assemble_diagonal, assemble_qfunction;
229e201c85SYohann   FieldsInt_Cuda indices;
239e201c85SYohann   Fields_Cuda    fields;
249e201c85SYohann   Fields_Cuda    B;
259e201c85SYohann   Fields_Cuda    G;
26241a4b83SYohann   CeedScalar    *W;
278b97b69aSJeremy L Thompson   Points_Cuda    points;
28241a4b83SYohann } CeedOperator_Cuda_gen;
29241a4b83SYohann 
30241a4b83SYohann typedef struct {
3109095acaSJeremy L Thompson   const char *qfunction_name;
32241a4b83SYohann   void       *d_c;
33241a4b83SYohann } CeedQFunction_Cuda_gen;
34241a4b83SYohann 
35241a4b83SYohann CEED_INTERN int CeedQFunctionCreate_Cuda_gen(CeedQFunction qf);
36241a4b83SYohann 
37241a4b83SYohann CEED_INTERN int CeedOperatorCreate_Cuda_gen(CeedOperator op);
38