1 // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 2 // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3 // 4 // SPDX-License-Identifier: BSD-2-Clause 5 // 6 // This file is part of CEED: http://github.com/ceed 7 8 #include <ceed.h> 9 #include <ceed/backend.h> 10 #include <ceed/jit-source/cuda/cuda-types.h> 11 #include <cuda.h> 12 13 #include "../cuda/ceed-cuda-common.h" 14 #include "../cuda/ceed-cuda-compile.h" 15 #include "ceed-cuda-ref-qfunction-load.h" 16 #include "ceed-cuda-ref.h" 17 18 //------------------------------------------------------------------------------ 19 // Apply QFunction 20 //------------------------------------------------------------------------------ 21 static int CeedQFunctionApply_Cuda(CeedQFunction qf, CeedInt Q, CeedVector *U, CeedVector *V) { 22 Ceed ceed; 23 Ceed_Cuda *ceed_Cuda; 24 CeedInt num_input_fields, num_output_fields; 25 CeedQFunction_Cuda *data; 26 27 CeedCallBackend(CeedQFunctionGetCeed(qf, &ceed)); 28 29 // Build and compile kernel, if not done 30 CeedCallBackend(CeedQFunctionBuildKernel_Cuda_ref(qf)); 31 32 CeedCallBackend(CeedQFunctionGetData(qf, &data)); 33 CeedCallBackend(CeedGetData(ceed, &ceed_Cuda)); 34 CeedCallBackend(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 35 36 // Read vectors 37 for (CeedInt i = 0; i < num_input_fields; i++) { 38 CeedCallBackend(CeedVectorGetArrayRead(U[i], CEED_MEM_DEVICE, &data->fields.inputs[i])); 39 } 40 for (CeedInt i = 0; i < num_output_fields; i++) { 41 CeedCallBackend(CeedVectorGetArrayWrite(V[i], CEED_MEM_DEVICE, &data->fields.outputs[i])); 42 } 43 44 // Get context data 45 CeedCallBackend(CeedQFunctionGetInnerContextData(qf, CEED_MEM_DEVICE, &data->d_c)); 46 47 // Run kernel 48 void *args[] = {&data->d_c, (void *)&Q, &data->fields}; 49 CeedCallBackend(CeedRunKernelAutoblockCuda(ceed, data->QFunction, Q, args)); 50 51 // Restore vectors 52 for (CeedInt i = 0; i < num_input_fields; i++) { 53 CeedCallBackend(CeedVectorRestoreArrayRead(U[i], &data->fields.inputs[i])); 54 } 55 for (CeedInt i = 0; i < num_output_fields; i++) { 56 CeedCallBackend(CeedVectorRestoreArray(V[i], &data->fields.outputs[i])); 57 } 58 59 // Restore context 60 CeedCallBackend(CeedQFunctionRestoreInnerContextData(qf, &data->d_c)); 61 return CEED_ERROR_SUCCESS; 62 } 63 64 //------------------------------------------------------------------------------ 65 // Destroy QFunction 66 //------------------------------------------------------------------------------ 67 static int CeedQFunctionDestroy_Cuda(CeedQFunction qf) { 68 CeedQFunction_Cuda *data; 69 70 CeedCallBackend(CeedQFunctionGetData(qf, &data)); 71 if (data->module) CeedCallCuda(CeedQFunctionReturnCeed(qf), cuModuleUnload(data->module)); 72 CeedCallBackend(CeedFree(&data)); 73 return CEED_ERROR_SUCCESS; 74 } 75 76 //------------------------------------------------------------------------------ 77 // Set User QFunction 78 //------------------------------------------------------------------------------ 79 static int CeedQFunctionSetCUDAUserFunction_Cuda(CeedQFunction qf, CUfunction f) { 80 CeedQFunction_Cuda *data; 81 82 CeedCallBackend(CeedQFunctionGetData(qf, &data)); 83 data->QFunction = f; 84 return CEED_ERROR_SUCCESS; 85 } 86 87 //------------------------------------------------------------------------------ 88 // Create QFunction 89 //------------------------------------------------------------------------------ 90 int CeedQFunctionCreate_Cuda(CeedQFunction qf) { 91 Ceed ceed; 92 CeedQFunction_Cuda *data; 93 94 CeedCallBackend(CeedQFunctionGetCeed(qf, &ceed)); 95 CeedCallBackend(CeedCalloc(1, &data)); 96 CeedCallBackend(CeedQFunctionSetData(qf, data)); 97 98 // Read QFunction source 99 CeedCallBackend(CeedQFunctionGetKernelName(qf, &data->qfunction_name)); 100 CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "----- Loading QFunction User Source -----\n"); 101 CeedCallBackend(CeedQFunctionLoadSourceToBuffer(qf, &data->qfunction_source)); 102 CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "----- Loading QFunction User Source Complete! -----\n"); 103 104 // Register backend functions 105 CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "Apply", CeedQFunctionApply_Cuda)); 106 CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "Destroy", CeedQFunctionDestroy_Cuda)); 107 CeedCallBackend(CeedSetBackendFunction(ceed, "QFunction", qf, "SetCUDAUserFunction", CeedQFunctionSetCUDAUserFunction_Cuda)); 108 return CEED_ERROR_SUCCESS; 109 } 110 111 //------------------------------------------------------------------------------ 112