xref: /libCEED/backends/cuda-ref/ceed-cuda-ref-qfunction.c (revision 346c77e6436e93de99b1714e06a264fc70d47960)
1 // Copyright (c) 2017-2026, Lawrence Livermore National Security, LLC and other CEED contributors.
2 // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3 //
4 // SPDX-License-Identifier: BSD-2-Clause
5 //
6 // This file is part of CEED:  http://github.com/ceed
7 
8 #include <ceed.h>
9 #include <ceed/backend.h>
10 #include <ceed/jit-source/cuda/cuda-types.h>
11 #include <cuda.h>
12 
13 #include "../cuda/ceed-cuda-common.h"
14 #include "../cuda/ceed-cuda-compile.h"
15 #include "ceed-cuda-ref-qfunction-load.h"
16 #include "ceed-cuda-ref.h"
17 
18 //------------------------------------------------------------------------------
19 // Apply QFunction
20 //------------------------------------------------------------------------------
21 static int CeedQFunctionApply_Cuda(CeedQFunction qf, CeedInt Q, CeedVector *U, CeedVector *V) {
22   Ceed                ceed;
23   Ceed_Cuda          *ceed_Cuda;
24   CeedInt             num_input_fields, num_output_fields;
25   CeedQFunction_Cuda *data;
26 
27   CeedCallBackend(CeedQFunctionGetCeed(qf, &ceed));
28 
29   // Build and compile kernel, if not done
30   CeedCallBackend(CeedQFunctionBuildKernel_Cuda_ref(qf));
31 
32   CeedCallBackend(CeedQFunctionGetData(qf, &data));
33   CeedCallBackend(CeedGetData(ceed, &ceed_Cuda));
34   CeedCallBackend(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields));
35 
36   // Read vectors
37   for (CeedInt i = 0; i < num_input_fields; i++) {
38     CeedCallBackend(CeedVectorGetArrayRead(U[i], CEED_MEM_DEVICE, &data->fields.inputs[i]));
39   }
40   for (CeedInt i = 0; i < num_output_fields; i++) {
41     CeedCallBackend(CeedVectorGetArrayWrite(V[i], CEED_MEM_DEVICE, &data->fields.outputs[i]));
42   }
43 
44   // Get context data
45   CeedCallBackend(CeedQFunctionGetInnerContextData(qf, CEED_MEM_DEVICE, &data->d_c));
46 
47   // Run kernel
48   void *args[] = {&data->d_c, (void *)&Q, &data->fields};
49   CeedCallBackend(CeedRunKernelAutoblockCuda(ceed, data->QFunction, Q, args));
50 
51   // Restore vectors
52   for (CeedInt i = 0; i < num_input_fields; i++) {
53     CeedCallBackend(CeedVectorRestoreArrayRead(U[i], &data->fields.inputs[i]));
54   }
55   for (CeedInt i = 0; i < num_output_fields; i++) {
56     CeedCallBackend(CeedVectorRestoreArray(V[i], &data->fields.outputs[i]));
57   }
58 
59   // Restore context
60   CeedCallBackend(CeedQFunctionRestoreInnerContextData(qf, &data->d_c));
61   CeedCallBackend(CeedDestroy(&ceed));
62   return CEED_ERROR_SUCCESS;
63 }
64 
65 //------------------------------------------------------------------------------
66 // Destroy QFunction
67 //------------------------------------------------------------------------------
68 static int CeedQFunctionDestroy_Cuda(CeedQFunction qf) {
69   CeedQFunction_Cuda *data;
70 
71   CeedCallBackend(CeedQFunctionGetData(qf, &data));
72   if (data->module) CeedCallCuda(CeedQFunctionReturnCeed(qf), cuModuleUnload(data->module));
73   CeedCallBackend(CeedFree(&data));
74   return CEED_ERROR_SUCCESS;
75 }
76 
77 //------------------------------------------------------------------------------
78 // Set User QFunction
79 //------------------------------------------------------------------------------
80 static int CeedQFunctionSetCUDAUserFunction_Cuda(CeedQFunction qf, CUfunction f) {
81   CeedQFunction_Cuda *data;
82 
83   CeedCallBackend(CeedQFunctionGetData(qf, &data));
84   data->QFunction = f;
85   return CEED_ERROR_SUCCESS;
86 }
87 
88 //------------------------------------------------------------------------------
89 // Create QFunction
90 //------------------------------------------------------------------------------
91 int CeedQFunctionCreate_Cuda(CeedQFunction qf) {
92   Ceed                ceed;
93   CeedQFunction_Cuda *data;
94 
95   CeedCallBackend(CeedQFunctionGetCeed(qf, &ceed));
96   CeedCallBackend(CeedCalloc(1, &data));
97   CeedCallBackend(CeedQFunctionSetData(qf, data));
98 
99   CeedCallBackend(CeedQFunctionGetKernelName(qf, &data->qfunction_name));
100 
101   // Register backend functions
102   CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "Apply", CeedQFunctionApply_Cuda));
103   CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "Destroy", CeedQFunctionDestroy_Cuda));
104   CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "SetCUDAUserFunction", CeedQFunctionSetCUDAUserFunction_Cuda));
105   CeedCallBackend(CeedDestroy(&ceed));
106   return CEED_ERROR_SUCCESS;
107 }
108 
109 //------------------------------------------------------------------------------
110