// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC. // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707. // All Rights reserved. See files LICENSE and NOTICE for details. // // This file is part of CEED, a collection of benchmarks, miniapps, software // libraries and APIs for efficient high-order finite element and spectral // element discretizations for exascale applications. For more information and // source code availability see http://github.com/ceed. // // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, // a collaborative effort of two U.S. Department of Energy organizations (Office // of Science and the National Nuclear Security Administration) responsible for // the planning and preparation of a capable exascale ecosystem, including // software, applications, hardware, advanced system engineering and early // testbed platforms, in support of the nation's exascale computing imperative. #include #include #include #include #include #include #include "ceed-cuda-ref.h" //------------------------------------------------------------------------------ // CUDA preferred MemType //------------------------------------------------------------------------------ static int CeedGetPreferredMemType_Cuda(CeedMemType *mem_type) { *mem_type = CEED_MEM_DEVICE; return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ // Get CUBLAS handle //------------------------------------------------------------------------------ int CeedCudaGetCublasHandle(Ceed ceed, cublasHandle_t *handle) { int ierr; Ceed_Cuda *data; ierr = CeedGetData(ceed, &data); CeedChkBackend(ierr); if (!data->cublas_handle) { ierr = cublasCreate(&data->cublas_handle); CeedChk_Cublas(ceed, ierr); } *handle = data->cublas_handle; return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ // Backend Init //------------------------------------------------------------------------------ static int CeedInit_Cuda(const char *resource, Ceed ceed) { int ierr; if (strcmp(resource, "/gpu/cuda/ref")) // LCOV_EXCL_START return CeedError(ceed, CEED_ERROR_BACKEND, "Cuda backend cannot use resource: %s", resource); // LCOV_EXCL_STOP ierr = CeedSetDeterministic(ceed, true); CeedChk(ierr); Ceed_Cuda *data; ierr = CeedCalloc(1, &data); CeedChkBackend(ierr); ierr = CeedSetData(ceed, data); CeedChkBackend(ierr); ierr = CeedCudaInit(ceed, resource); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "GetPreferredMemType", CeedGetPreferredMemType_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "VectorCreate", CeedVectorCreate_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "BasisCreateTensorH1", CeedBasisCreateTensorH1_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "BasisCreateH1", CeedBasisCreateH1_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "ElemRestrictionCreate", CeedElemRestrictionCreate_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "ElemRestrictionCreateBlocked", CeedElemRestrictionCreateBlocked_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "QFunctionCreate", CeedQFunctionCreate_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "QFunctionContextCreate", CeedQFunctionContextCreate_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "OperatorCreate", CeedOperatorCreate_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "CompositeOperatorCreate", CeedCompositeOperatorCreate_Cuda); CeedChkBackend(ierr); ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "Destroy", CeedDestroy_Cuda); CeedChkBackend(ierr); return CEED_ERROR_SUCCESS; } //------------------------------------------------------------------------------ // Backend Register //------------------------------------------------------------------------------ CEED_INTERN int CeedRegister_Cuda(void) { return CeedRegister("/gpu/cuda/ref", CeedInit_Cuda, 40); } //------------------------------------------------------------------------------