| /libCEED/backends/sycl/ |
| H A D | online_compiler.sycl.cpp | 19 void *loadOsLibrary(const std::string &PluginPath) { in loadOsLibrary() 25 …std::cerr << "dlopen(" << PluginPath << ") failed with <" << (Error ? Error : "unknown error") << … in loadOsLibrary() 38 void *getOsLibraryFuncAddress(void *Library, const std::string &FunctionName) { return dlsym(Librar… in getOsLibraryFuncAddress() 40 static std::vector<const char *> prepareOclocArgs(sycl::info::device_type DeviceType, device_arch D… in prepareOclocArgs() 41 … const std::string &DeviceStepping, const std::string &UserArgs) { in prepareOclocArgs() 42 std::vector<const char *> Args = {"ocloc", "-q", "-spv_only", "-device"}; in prepareOclocArgs() 100 static std::vector<byte> compileToSPIRV(const std::string &Source, sycl::info::device_type DeviceTy… in compileToSPIRV() 101 … const std::string &DeviceStepping, void *&CompileToSPIRVHandle, void *&FreeSPIRVOutputsHandle, in compileToSPIRV() 102 const std::vector<std::string> &UserArgs) { in compileToSPIRV() 105 static const std::string OclocLibraryName = "ocloc64.dll"; in compileToSPIRV() [all …]
|
| H A D | ceed-sycl-compile.sycl.cpp | 22 using ByteVector_t = std::vector<unsigned char>; 27 static int CeedJitAddDefinitions_Sycl(Ceed ceed, const std::string &kernel_source, std::string &jit… in CeedJitAddDefinitions_Sycl() 28 const std::map<std::string, CeedInt> &constants = {}) { in CeedJitAddDefinitions_Sycl() 29 std::ostringstream oss; 63 static inline int CeedJitGetFlags_Sycl(std::vector<std::string> &flags) { in CeedJitGetFlags_Sycl() 64 …flags = {std::string("-cl-std=CL3.0"), std::string("-Dint32_t=int"), std::string("-DCEED_RUNNING_J… in CeedJitGetFlags_Sycl() 71 static inline int CeedJitCompileSource_Sycl(Ceed ceed, const sycl::device &sycl_device, const std::… in CeedJitCompileSource_Sycl() 72 const std::vector<std::string> &flags = {}) { in CeedJitCompileSource_Sycl() 124 … CeedBuildModule_Sycl(Ceed ceed, const std::string &kernel_source, SyclModule_t **sycl_module, con… in CeedBuildModule_Sycl() 126 std::string jit_source; in CeedBuildModule_Sycl() [all …]
|
| H A D | online_compiler.hpp | 66 …online_compile_error(const std::string &Msg) : sycl::exception(make_error_code(errc::invalid), Msg… in online_compile_error() 116 std::vector<byte> compile(const std::string &src, const Tys &...args); 157 online_compiler<Lang> &setTargetDeviceStepping(const std::string &id) { in setTargetDeviceStepping() 167 std::pair<int, int> OutputFormatVersion; 179 std::string DeviceStepping; 195 std::vector<byte> online_compiler<source_language::opencl_c>::compile(const std::string &src, const… 211 std::vector<byte> online_compiler<source_language::cm>::compile(const std::string &src, const std::…
|
| H A D | ceed-sycl-compile.hpp | 17 CEED_INTERN int CeedBuildModule_Sycl(Ceed ceed, const std::string &kernel_source, SyclModule_t **sy… 18 const std::map<std::string, CeedInt> &constants = {}); 19 CEED_INTERN int CeedGetKernel_Sycl(Ceed ceed, const SyclModule_t *sycl_module, const std::string &k…
|
| H A D | ceed-sycl-common.sycl.cpp | 20 const char *device_spec = std::strstr(resource, ":device_id="); in CeedInit_Sycl() 24 if (std::strstr(resource, "/gpu/sycl")) { in CeedInit_Sycl() 26 } else if (std::strstr(resource, "/cpu/sycl")) { in CeedInit_Sycl() 54 for (std::exception_ptr const &e : exceptionList) { in CeedInit_Sycl() 56 std::rethrow_exception(e); in CeedInit_Sycl() 58 std::ostringstream error_msg; in CeedInit_Sycl() 60 error_msg << e.what() << std::endl; in CeedInit_Sycl()
|
| /libCEED/examples/deal.II/ |
| H A D | bps-kokkos.cc | 65 std::string libCEED_resource = "/cpu/self"; 70 if (argc == 1 && (std::string(argv[0]) == "--help")) in parse() 72 std::cout << "Usage: ./bp [OPTION]..." << std::endl; in parse() 73 std::cout << std::endl; in parse() 74 std::cout << "--bp name of benchmark (BP1-BP6)" << std::endl; in parse() 75 std::cout << "--n_refinements number of refinements (0-)" << std::endl; in parse() 76 std::cout << "--fe_degree polynomial degree (1-)" << std::endl; in parse() 77 std::cout << "--print_timings name of benchmark (0, 1)" << std::endl; in parse() 78 std::cout << "--resource name of resource (e.g., /cpu/self/avx/blocked)" << std::endl; in parse() 87 std::string label(argv[0]); in parse() [all …]
|
| H A D | bps-cpu.cc | 65 std::string libCEED_resource = "/cpu/self"; 70 if (argc == 1 && (std::string(argv[0]) == "--help")) in parse() 72 std::cout << "Usage: ./bp [OPTION]..." << std::endl; in parse() 73 std::cout << std::endl; in parse() 74 std::cout << "--bp name of benchmark (BP1-BP6)" << std::endl; in parse() 75 std::cout << "--n_refinements number of refinements (0-)" << std::endl; in parse() 76 std::cout << "--fe_degree polynomial degree (1-)" << std::endl; in parse() 77 std::cout << "--print_timings name of benchmark (0, 1)" << std::endl; in parse() 78 std::cout << "--resource name of resource (e.g., /cpu/self/avx/blocked)" << std::endl; in parse() 87 std::string label(argv[0]); in parse() [all …]
|
| H A D | bps-ceed.h | 64 const std::string &resource) in OperatorCeed() 124 std::vector<CeedScalar> q_ref_1d; in reinit() 129 std::vector<CeedScalar> interp_1d(shape_data.shape_values.size()); in reinit() 130 std::vector<CeedScalar> grad_1d(shape_data.shape_gradients.size()); in reinit() 158 std::make_shared<Utilities::MPI::Partitioner>(dof_handler.locally_owned_dofs(), in reinit() 163 std::vector<CeedInt> indices; in reinit() 168 std::vector<types::global_dof_index> local_indices(fe.n_dofs_per_cell()); in reinit() 325 i = (std::abs(i) > 1.0e-10) ? (1.0 / i) : 1.0; in compute_inverse_diagonal() 417 static std::vector<double> 424 std::vector<double> metric_data_raw; in compute_metric_data() [all …]
|
| /libCEED/backends/magma/tuning/ |
| H A D | a100.h | 5 std::vector<std::array<int, RECORD_LENGTH> > sgemm_nn_a100 = { 617 std::vector<std::array<int, RECORD_LENGTH> > sgemm_tn_a100 = { 1229 std::vector<std::array<int, RECORD_LENGTH> > dgemm_nn_a100 = { 1841 std::vector<std::array<int, RECORD_LENGTH> > dgemm_tn_a100 = {
|
| H A D | mi250x.h | 5 std::vector<std::array<int, RECORD_LENGTH> > sgemm_nn_mi250x = { 617 std::vector<std::array<int, RECORD_LENGTH> > sgemm_tn_mi250x = { 1229 std::vector<std::array<int, RECORD_LENGTH> > dgemm_nn_mi250x = { 1841 std::vector<std::array<int, RECORD_LENGTH> > dgemm_tn_mi250x = {
|
| H A D | mi100.h | 5 std::vector<std::array<int, RECORD_LENGTH> > sgemm_nn_mi100 = { 617 std::vector<std::array<int, RECORD_LENGTH> > sgemm_tn_mi100 = { 1229 std::vector<std::array<int, RECORD_LENGTH> > dgemm_nn_mi100 = { 1841 std::vector<std::array<int, RECORD_LENGTH> > dgemm_tn_mi100 = {
|
| H A D | v100.h | 5 std::vector<std::array<int, RECORD_LENGTH> > sgemm_nn_v100 = { 617 std::vector<std::array<int, RECORD_LENGTH> > sgemm_tn_v100 = { 1229 std::vector<std::array<int, RECORD_LENGTH> > dgemm_nn_v100 = { 1841 std::vector<std::array<int, RECORD_LENGTH> > dgemm_tn_v100 = {
|
| H A D | tuning.cpp | 20 constexpr static std::array<std::array<int, 3>, 22> PQ_VALUES = { 28 constexpr static std::array<std::pair<int, int>, 7> N_VALUES = { 32 using Clock = std::chrono::steady_clock; 33 using Duration = std::chrono::duration<double>; 38 std::random_device rand_device; in main() 39 std::default_random_engine rand_engine(rand_device()); in main() 40 std::uniform_real_distribution<> rand_dist(0.0, 1.0); in main() 54 std::vector<double> q_ref(dim * Q, 0.0), q_weight(Q, 0.0), interp(P * Q), grad(P * Q * dim); in main() 55 std::generate(interp.begin(), interp.end(), generate_random); in main() 56 std::generate(grad.begin(), grad.end(), generate_random); in main() [all …]
|
| H A D | a100_rtc.h | 5 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_t_a100 = { 317 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_n_a100 = {
|
| H A D | mi250x_rtc.h | 5 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_t_mi250x = { 317 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_n_mi250x = {
|
| H A D | mi100_rtc.h | 5 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_t_mi100 = { 317 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_n_mi100 = {
|
| H A D | v100_rtc.h | 5 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_t_v100 = { 317 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_n_v100 = {
|
| H A D | h100_rtc.h | 5 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_t_h100 = { 317 std::vector<std::array<int, RECORD_LENGTH_RTC> > drtc_n_h100 = {
|
| /libCEED/backends/cuda/ |
| H A D | ceed-cuda-compile.cpp | 49 FILE *output_stream = popen((command + std::string(" 2>&1")).c_str(), "r"); in CeedCallSystem_Core() 54 std::string output = ""; in CeedCallSystem_Core() 67 using std::ifstream; 68 using std::ofstream; 69 using std::ostringstream; 84 std::ostringstream code; in CeedCompileCore_Cuda() 114 std::string arch_arg = in CeedCompileCore_Cuda() 124 + std::to_string(prop.major) + std::to_string(prop.minor); in CeedCompileCore_Cuda() 135 std::ostringstream include_dir_arg; in CeedCompileCore_Cuda() 149 std::ostringstream define_arg; in CeedCompileCore_Cuda() [all …]
|
| /libCEED/rust/libceed/src/ |
| H A D | qfunction.rs | 11 use std::pin::Pin; 48 let mut name_ptr: *mut std::os::raw::c_char = std::ptr::null_mut(); in name() 378 let mut ptr = std::ptr::null_mut(); in fmt() 456 let mut u_c = [std::ptr::null_mut(); MAX_QFUNCTION_FIELDS]; in apply() 457 for i in 0..std::cmp::min(MAX_QFUNCTION_FIELDS, u.len()) { in apply() 460 let mut v_c = [std::ptr::null_mut(); MAX_QFUNCTION_FIELDS]; in apply() 461 for i in 0..std::cmp::min(MAX_QFUNCTION_FIELDS, v.len()) { in apply() 473 let mut inputs_ptr = std::ptr::null_mut(); in inputs() 479 std::ptr::null_mut() as *mut bind_ceed::CeedInt, in inputs() 480 std::ptr::null_mut(), in inputs() [all …]
|
| H A D | operator.rs | 41 let mut vector_ptr = std::ptr::null_mut(); in from_raw() 46 let mut elem_restriction_ptr = std::ptr::null_mut(); in from_raw() 54 let mut basis_ptr = std::ptr::null_mut(); in from_raw() 104 let mut name_ptr: *mut std::os::raw::c_char = std::ptr::null_mut(); in name() 334 let mut ptr = std::ptr::null_mut(); in fmt() 548 let mut ptr = std::ptr::null_mut(); in create() 862 let mut inputs_ptr = std::ptr::null_mut(); in inputs() 868 std::ptr::null_mut() as *mut bind_ceed::CeedInt, in inputs() 869 std::ptr::null_mut(), in inputs() 874 std::slice::from_raw_parts( in inputs() [all …]
|
| /libCEED/examples/mfem/ |
| H A D | bp1.cpp | 70 args.PrintUsage(std::cout); in main() 74 args.PrintOptions(std::cout); in main() 107 std::cout << "Number of finite element unknowns: " << fespace->GetTrueVSize() << std::endl; in main() 137 std::cout << "L2 projection error: " << err_l2 << std::endl; in main() 140 std::cout << "Error too large: " << err_l2 << std::endl; in main() 150 sol_sock << "solution\n" << *mesh << sol << std::flush; in main()
|
| H A D | bp3.cpp | 92 args.PrintUsage(std::cout); in main() 96 args.PrintOptions(std::cout); in main() 129 std::cout << "Number of finite element unknowns: " << fespace->GetTrueVSize() << std::endl; in main() 171 std::cout << "L2 projection error: " << err_l2 << std::endl; in main() 174 std::cout << "Error too large: " << err_l2 << std::endl; in main() 184 sol_sock << "solution\n" << *mesh << sol << std::flush; in main()
|
| /libCEED/backends/sycl-ref/ |
| H A D | ceed-sycl-ref-qfunction-load.sycl.cpp | 48 std::vector<CeedInt> input_sizes(num_input_fields); in CeedQFunctionBuildKernel_Sycl() 56 std::vector<CeedInt> output_sizes(num_output_fields); in CeedQFunctionBuildKernel_Sycl() 81 std::string_view qf_name_view(qfunction_name); in CeedQFunctionBuildKernel_Sycl() 82 std::string_view qf_source_view(qfunction_source); in CeedQFunctionBuildKernel_Sycl() 83 std::string_view rw_source_view(read_write_kernel_source); in CeedQFunctionBuildKernel_Sycl() 84 const std::string kernel_name = "CeedKernelSyclRefQFunction_" + std::string(qf_name_view); in CeedQFunctionBuildKernel_Sycl() 87 std::ostringstream code; in CeedQFunctionBuildKernel_Sycl()
|
| /libCEED/backends/sycl-shared/ |
| H A D | ceed-sycl-shared.sycl.cpp | 26 …CeedCheck(!std::strcmp(resource_root, "/gpu/sycl/shared") || !std::strcmp(resource_root, "/cpu/syc… in CeedInit_Sycl_shared() 28 std::string_view root_view = resource_root; in CeedInit_Sycl_shared() 33 std::ostringstream ref_resource; in CeedInit_Sycl_shared()
|