xref: /libCEED/backends/cuda-ref/ceed-cuda-ref-qfunction.c (revision 3bd616174f267007922ecd7132753928e1173772)
1 // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
2 // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3 //
4 // SPDX-License-Identifier: BSD-2-Clause
5 //
6 // This file is part of CEED:  http://github.com/ceed
7 
8 #include <ceed.h>
9 #include <ceed/backend.h>
10 #include <ceed/jit-source/cuda/cuda-types.h>
11 #include <cuda.h>
12 
13 #include "../cuda/ceed-cuda-common.h"
14 #include "../cuda/ceed-cuda-compile.h"
15 #include "ceed-cuda-ref-qfunction-load.h"
16 #include "ceed-cuda-ref.h"
17 
18 //------------------------------------------------------------------------------
19 // Apply QFunction
20 //------------------------------------------------------------------------------
21 static int CeedQFunctionApply_Cuda(CeedQFunction qf, CeedInt Q, CeedVector *U, CeedVector *V) {
22   Ceed                ceed;
23   Ceed_Cuda          *ceed_Cuda;
24   CeedInt             num_input_fields, num_output_fields;
25   CeedQFunction_Cuda *data;
26 
27   CeedCallBackend(CeedQFunctionGetCeed(qf, &ceed));
28 
29   // Build and compile kernel, if not done
30   CeedCallBackend(CeedQFunctionBuildKernel_Cuda_ref(qf));
31 
32   CeedCallBackend(CeedQFunctionGetData(qf, &data));
33   CeedCallBackend(CeedGetData(ceed, &ceed_Cuda));
34   CeedCallBackend(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields));
35 
36   // Read vectors
37   for (CeedInt i = 0; i < num_input_fields; i++) {
38     CeedCallBackend(CeedVectorGetArrayRead(U[i], CEED_MEM_DEVICE, &data->fields.inputs[i]));
39   }
40   for (CeedInt i = 0; i < num_output_fields; i++) {
41     CeedCallBackend(CeedVectorGetArrayWrite(V[i], CEED_MEM_DEVICE, &data->fields.outputs[i]));
42   }
43 
44   // Get context data
45   CeedCallBackend(CeedQFunctionGetInnerContextData(qf, CEED_MEM_DEVICE, &data->d_c));
46 
47   // Run kernel
48   void *args[] = {&data->d_c, (void *)&Q, &data->fields};
49   CeedCallBackend(CeedRunKernelAutoblockCuda(ceed, data->QFunction, Q, args));
50 
51   // Restore vectors
52   for (CeedInt i = 0; i < num_input_fields; i++) {
53     CeedCallBackend(CeedVectorRestoreArrayRead(U[i], &data->fields.inputs[i]));
54   }
55   for (CeedInt i = 0; i < num_output_fields; i++) {
56     CeedCallBackend(CeedVectorRestoreArray(V[i], &data->fields.outputs[i]));
57   }
58 
59   // Restore context
60   CeedCallBackend(CeedQFunctionRestoreInnerContextData(qf, &data->d_c));
61   return CEED_ERROR_SUCCESS;
62 }
63 
64 //------------------------------------------------------------------------------
65 // Destroy QFunction
66 //------------------------------------------------------------------------------
67 static int CeedQFunctionDestroy_Cuda(CeedQFunction qf) {
68   Ceed                ceed;
69   CeedQFunction_Cuda *data;
70 
71   CeedCallBackend(CeedQFunctionGetData(qf, &data));
72   CeedCallBackend(CeedQFunctionGetCeed(qf, &ceed));
73   if (data->module) CeedCallCuda(ceed, cuModuleUnload(data->module));
74   CeedCallBackend(CeedFree(&data));
75   return CEED_ERROR_SUCCESS;
76 }
77 
78 //------------------------------------------------------------------------------
79 // Set User QFunction
80 //------------------------------------------------------------------------------
81 static int CeedQFunctionSetCUDAUserFunction_Cuda(CeedQFunction qf, CUfunction f) {
82   CeedQFunction_Cuda *data;
83 
84   CeedCallBackend(CeedQFunctionGetData(qf, &data));
85   data->QFunction = f;
86   return CEED_ERROR_SUCCESS;
87 }
88 
89 //------------------------------------------------------------------------------
90 // Create QFunction
91 //------------------------------------------------------------------------------
92 int CeedQFunctionCreate_Cuda(CeedQFunction qf) {
93   Ceed                ceed;
94   CeedQFunction_Cuda *data;
95 
96   CeedQFunctionGetCeed(qf, &ceed);
97   CeedCallBackend(CeedCalloc(1, &data));
98   CeedCallBackend(CeedQFunctionSetData(qf, data));
99 
100   // Read QFunction source
101   CeedCallBackend(CeedQFunctionGetKernelName(qf, &data->qfunction_name));
102   CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "----- Loading QFunction User Source -----\n");
103   CeedCallBackend(CeedQFunctionLoadSourceToBuffer(qf, &data->qfunction_source));
104   CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "----- Loading QFunction User Source Complete! -----\n");
105 
106   // Register backend functions
107   CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "Apply", CeedQFunctionApply_Cuda));
108   CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "Destroy", CeedQFunctionDestroy_Cuda));
109   CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "SetCUDAUserFunction", CeedQFunctionSetCUDAUserFunction_Cuda));
110   return CEED_ERROR_SUCCESS;
111 }
112 
113 //------------------------------------------------------------------------------
114