xref: /libCEED/backends/avx/ceed-avx-blocked.c (revision 3f21f6b10abeb5d85d3454ea5cd38498737dc88a)
1 // Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
2 // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
3 // All Rights reserved. See files LICENSE and NOTICE for details.
4 //
5 // This file is part of CEED, a collection of benchmarks, miniapps, software
6 // libraries and APIs for efficient high-order finite element and spectral
7 // element discretizations for exascale applications. For more information and
8 // source code availability see http://github.com/ceed.
9 //
10 // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11 // a collaborative effort of two U.S. Department of Energy organizations (Office
12 // of Science and the National Nuclear Security Administration) responsible for
13 // the planning and preparation of a capable exascale ecosystem, including
14 // software, applications, hardware, advanced system engineering and early
15 // testbed platforms, in support of the nation's exascale computing imperative.
16 
17 #include <ceed/ceed.h>
18 #include <ceed/backend.h>
19 #include <stdbool.h>
20 #include <string.h>
21 #include "ceed-avx.h"
22 
23 //------------------------------------------------------------------------------
24 // Backend Init
25 //------------------------------------------------------------------------------
26 static int CeedInit_Avx(const char *resource, Ceed ceed) {
27   int ierr;
28   if (strcmp(resource, "/cpu/self") && strcmp(resource, "/cpu/self/avx") &&
29       strcmp(resource, "/cpu/self/avx/blocked"))
30     // LCOV_EXCL_START
31     return CeedError(ceed, CEED_ERROR_BACKEND,
32                      "AVX backend cannot use resource: %s", resource);
33   // LCOV_EXCL_STOP
34   ierr = CeedSetDeterministic(ceed, true); CeedChkBackend(ierr);
35 
36   // Create reference CEED that implementation will be dispatched
37   //   through unless overridden
38   Ceed ceed_ref;
39   CeedInit("/cpu/self/opt/blocked", &ceed_ref);
40   ierr = CeedSetDelegate(ceed, ceed_ref); CeedChkBackend(ierr);
41 
42   if (CEED_SCALAR_TYPE == CEED_SCALAR_FP64) {
43     ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "TensorContractCreate",
44                                   CeedTensorContractCreate_f64_Avx);
45     CeedChkBackend(ierr);
46   } else {
47     ierr = CeedSetBackendFunction(ceed, "Ceed", ceed, "TensorContractCreate",
48                                   CeedTensorContractCreate_f32_Avx);
49     CeedChkBackend(ierr);
50   }
51 
52   return CEED_ERROR_SUCCESS;
53 }
54 
55 //------------------------------------------------------------------------------
56 // Backend Register
57 //------------------------------------------------------------------------------
58 CEED_INTERN int CeedRegister_Avx_Blocked(void) {
59   return CeedRegister("/cpu/self/avx/blocked", CeedInit_Avx, 30);
60 }
61 //------------------------------------------------------------------------------
62