// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16 17 #include <ceed/ceed.h> 18 #include <ceed/backend.h> 19 #include <cublas_v2.h> 20 #include <cuda.h> 21 #include <cuda_runtime.h> 22 #include <string.h> 23 #include "ceed-cuda-ref.h" 24 25 //------------------------------------------------------------------------------ 26 // CUDA preferred MemType 27 //------------------------------------------------------------------------------ 28 static int CeedGetPreferredMemType_Cuda(CeedMemType *type) { 29 *type = CEED_MEM_DEVICE; 30 return CEED_ERROR_SUCCESS; 31 } 32 33 //------------------------------------------------------------------------------ 34 // Get CUBLAS handle 35 //------------------------------------------------------------------------------ 36 int CeedCudaGetCublasHandle(Ceed ceed, cublasHandle_t *handle) { 37 int ierr; 38 Ceed_Cuda *data; 39 ierr = CeedGetData(ceed, &data); CeedChkBackend(ierr); 40 41 if (!data->cublas_handle) { 42 ierr = cublasCreate(&data->cublas_handle); CeedChk_Cublas(ceed, ierr); 43 } 44 *handle = data->cublas_handle; 45 return CEED_ERROR_SUCCESS; 46 } 47 48 //------------------------------------------------------------------------------ 49 // Backend Init 50 //------------------------------------------------------------------------------ 51 static int CeedInit_Cuda(const char *resource, Ceed ceed) { 52 int ierr; 53 54 if (strcmp(resource, "/gpu/cuda/ref")) 55 // LCOV_EXCL_START 56 return CeedError(ceed, CEED_ERROR_BACKEND, 57 "Cuda backend cannot use resource: %s", resource); 58 // LCOV_EXCL_STOP 59 ierr = CeedSetDeterministic(ceed, true); CeedChk(ierr); 60 61 Ceed_Cuda *data; 62 ierr = CeedCalloc(1, &data); CeedChkBackend(ierr); 63 ierr = CeedSetData(ceed, data); CeedChkBackend(ierr); 64 ierr = CeedCudaInit(ceed, resource); CeedChkBackend(ierr); 65 66 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "GetPreferredMemType", 67 CeedGetPreferredMemType_Cuda); CeedChkBackend(ierr); 68 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "VectorCreate", 69 CeedVectorCreate_Cuda); 
CeedChkBackend(ierr); 70 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "BasisCreateTensorH1", 71 CeedBasisCreateTensorH1_Cuda); CeedChkBackend(ierr); 72 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "BasisCreateH1", 73 CeedBasisCreateH1_Cuda); CeedChkBackend(ierr); 74 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "ElemRestrictionCreate", 75 CeedElemRestrictionCreate_Cuda); CeedChkBackend(ierr); 76 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, 77 "ElemRestrictionCreateBlocked", 78 CeedElemRestrictionCreateBlocked_Cuda); 79 CeedChkBackend(ierr); 80 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "QFunctionCreate", 81 CeedQFunctionCreate_Cuda); CeedChkBackend(ierr); 82 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "QFunctionContextCreate", 83 CeedQFunctionContextCreate_Cuda); CeedChkBackend(ierr); 84 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "OperatorCreate", 85 CeedOperatorCreate_Cuda); CeedChkBackend(ierr); 86 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "CompositeOperatorCreate", 87 CeedCompositeOperatorCreate_Cuda); CeedChkBackend(ierr); 88 ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "Destroy", 89 CeedDestroy_Cuda); CeedChkBackend(ierr); 90 return CEED_ERROR_SUCCESS; 91 } 92 93 //------------------------------------------------------------------------------ 94 // Backend Register 95 //------------------------------------------------------------------------------ 96 CEED_INTERN int CeedRegister_Cuda(void) { 97 return CeedRegister("/gpu/cuda/ref", CeedInit_Cuda, 40); 98 } 99 //------------------------------------------------------------------------------ 100