xref: /libCEED/rust/libceed-sys/c-src/backends/sycl-ref/ceed-sycl-vector.sycl.cpp (revision 1f4b1b45844fd6ef75549b644944f35065f07aef)
15aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors.
2bd882c8aSJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3bd882c8aSJames Wright //
4bd882c8aSJames Wright // SPDX-License-Identifier: BSD-2-Clause
5bd882c8aSJames Wright //
6bd882c8aSJames Wright // This file is part of CEED:  http://github.com/ceed
7bd882c8aSJames Wright 
8bd882c8aSJames Wright #include <ceed/backend.h>
9bd882c8aSJames Wright #include <ceed/ceed.h>
10bd882c8aSJames Wright 
11bd882c8aSJames Wright #include <cmath>
12bd882c8aSJames Wright #include <string>
13bd882c8aSJames Wright #include <sycl/sycl.hpp>
14bd882c8aSJames Wright 
15bd882c8aSJames Wright #include "ceed-sycl-ref.hpp"
16bd882c8aSJames Wright 
17bd882c8aSJames Wright //------------------------------------------------------------------------------
18bd882c8aSJames Wright // Check if host/device sync is needed
19bd882c8aSJames Wright //------------------------------------------------------------------------------
20bd882c8aSJames Wright static inline int CeedVectorNeedSync_Sycl(const CeedVector vec, CeedMemType mem_type, bool *need_sync) {
21bd882c8aSJames Wright   bool             has_valid_array = false;
22dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
23dd64fc84SJeremy L Thompson 
24dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
25bd882c8aSJames Wright   CeedCallBackend(CeedVectorHasValidArray(vec, &has_valid_array));
26bd882c8aSJames Wright   switch (mem_type) {
27bd882c8aSJames Wright     case CEED_MEM_HOST:
28bd882c8aSJames Wright       *need_sync = has_valid_array && !impl->h_array;
29bd882c8aSJames Wright       break;
30bd882c8aSJames Wright     case CEED_MEM_DEVICE:
31bd882c8aSJames Wright       *need_sync = has_valid_array && !impl->d_array;
32bd882c8aSJames Wright       break;
33bd882c8aSJames Wright   }
34bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
35bd882c8aSJames Wright }
36bd882c8aSJames Wright 
37bd882c8aSJames Wright //------------------------------------------------------------------------------
38bd882c8aSJames Wright // Sync host to device
39bd882c8aSJames Wright //------------------------------------------------------------------------------
40bd882c8aSJames Wright static inline int CeedVectorSyncH2D_Sycl(const CeedVector vec) {
41bd882c8aSJames Wright   Ceed             ceed;
42bd882c8aSJames Wright   Ceed_Sycl       *data;
43dd64fc84SJeremy L Thompson   CeedSize         length;
44dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
45dd64fc84SJeremy L Thompson 
46dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
47dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
48bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
494e3038a5SJeremy L Thompson   CeedCheck(impl->h_array, ceed, CEED_ERROR_BACKEND, "No valid host data to sync to device");
50bd882c8aSJames Wright 
51bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetLength(vec, &length));
52bd882c8aSJames Wright   if (impl->d_array_borrowed) {
53bd882c8aSJames Wright     impl->d_array = impl->d_array_borrowed;
54bd882c8aSJames Wright   } else if (impl->d_array_owned) {
55bd882c8aSJames Wright     impl->d_array = impl->d_array_owned;
56bd882c8aSJames Wright   } else {
57bd882c8aSJames Wright     CeedCallSycl(ceed, impl->d_array_owned = sycl::malloc_device<CeedScalar>(length, data->sycl_device, data->sycl_context));
58bd882c8aSJames Wright     impl->d_array = impl->d_array_owned;
59bd882c8aSJames Wright   }
60bd882c8aSJames Wright 
61bd882c8aSJames Wright   // Copy from host to device
62*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
63*1f4b1b45SUmesh Unnikrishnan 
64*1f4b1b45SUmesh Unnikrishnan   if (!data->sycl_queue.is_in_order()) e = {data->sycl_queue.ext_oneapi_submit_barrier()};
65*1f4b1b45SUmesh Unnikrishnan   CeedCallSycl(ceed, data->sycl_queue.copy<CeedScalar>(impl->h_array, impl->d_array, length, e).wait_and_throw());
66bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
67bd882c8aSJames Wright }
68bd882c8aSJames Wright 
69bd882c8aSJames Wright //------------------------------------------------------------------------------
70bd882c8aSJames Wright // Sync device to host
71bd882c8aSJames Wright //------------------------------------------------------------------------------
72bd882c8aSJames Wright static inline int CeedVectorSyncD2H_Sycl(const CeedVector vec) {
73bd882c8aSJames Wright   Ceed             ceed;
74bd882c8aSJames Wright   Ceed_Sycl       *data;
75dd64fc84SJeremy L Thompson   CeedSize         length;
76dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
77dd64fc84SJeremy L Thompson 
78dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
79dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
80bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
81bd882c8aSJames Wright 
82bd882c8aSJames Wright   CeedCheck(impl->d_array, ceed, CEED_ERROR_BACKEND, "No valid device data to sync to host");
83bd882c8aSJames Wright 
84bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetLength(vec, &length));
85bd882c8aSJames Wright   if (impl->h_array_borrowed) {
86bd882c8aSJames Wright     impl->h_array = impl->h_array_borrowed;
87bd882c8aSJames Wright   } else if (impl->h_array_owned) {
88bd882c8aSJames Wright     impl->h_array = impl->h_array_owned;
89bd882c8aSJames Wright   } else {
90bd882c8aSJames Wright     CeedCallBackend(CeedCalloc(length, &impl->h_array_owned));
91bd882c8aSJames Wright     impl->h_array = impl->h_array_owned;
92bd882c8aSJames Wright   }
93bd882c8aSJames Wright 
94bd882c8aSJames Wright   // Copy from device to host
95*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
96*1f4b1b45SUmesh Unnikrishnan 
97*1f4b1b45SUmesh Unnikrishnan   if (!data->sycl_queue.is_in_order()) e = {data->sycl_queue.ext_oneapi_submit_barrier()};
98*1f4b1b45SUmesh Unnikrishnan   CeedCallSycl(ceed, data->sycl_queue.copy<CeedScalar>(impl->d_array, impl->h_array, length, e).wait_and_throw());
99bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
100bd882c8aSJames Wright }
101bd882c8aSJames Wright 
102bd882c8aSJames Wright //------------------------------------------------------------------------------
103bd882c8aSJames Wright // Sync arrays
104bd882c8aSJames Wright //------------------------------------------------------------------------------
105bd882c8aSJames Wright static int CeedVectorSyncArray_Sycl(const CeedVector vec, CeedMemType mem_type) {
106bd882c8aSJames Wright   bool need_sync = false;
107dd64fc84SJeremy L Thompson 
108dd64fc84SJeremy L Thompson   // Check whether device/host sync is needed
109bd882c8aSJames Wright   CeedCallBackend(CeedVectorNeedSync_Sycl(vec, mem_type, &need_sync));
110bd882c8aSJames Wright   if (!need_sync) return CEED_ERROR_SUCCESS;
111bd882c8aSJames Wright 
112bd882c8aSJames Wright   switch (mem_type) {
113bd882c8aSJames Wright     case CEED_MEM_HOST:
114bd882c8aSJames Wright       return CeedVectorSyncD2H_Sycl(vec);
115bd882c8aSJames Wright     case CEED_MEM_DEVICE:
116bd882c8aSJames Wright       return CeedVectorSyncH2D_Sycl(vec);
117bd882c8aSJames Wright   }
118bd882c8aSJames Wright   return CEED_ERROR_UNSUPPORTED;
119bd882c8aSJames Wright }
120bd882c8aSJames Wright 
121bd882c8aSJames Wright //------------------------------------------------------------------------------
122bd882c8aSJames Wright // Set all pointers as invalid
123bd882c8aSJames Wright //------------------------------------------------------------------------------
124bd882c8aSJames Wright static inline int CeedVectorSetAllInvalid_Sycl(const CeedVector vec) {
125bd882c8aSJames Wright   CeedVector_Sycl *impl;
126bd882c8aSJames Wright 
127dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
128bd882c8aSJames Wright   impl->h_array = NULL;
129bd882c8aSJames Wright   impl->d_array = NULL;
130bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
131bd882c8aSJames Wright }
132bd882c8aSJames Wright 
133bd882c8aSJames Wright //------------------------------------------------------------------------------
134bd882c8aSJames Wright // Check if CeedVector has any valid pointer
135bd882c8aSJames Wright //------------------------------------------------------------------------------
136bd882c8aSJames Wright static inline int CeedVectorHasValidArray_Sycl(const CeedVector vec, bool *has_valid_array) {
137bd882c8aSJames Wright   CeedVector_Sycl *impl;
138dd64fc84SJeremy L Thompson 
139bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(vec, &impl));
1401c66c397SJeremy L Thompson   *has_valid_array = impl->h_array || impl->d_array;
141bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
142bd882c8aSJames Wright }
143bd882c8aSJames Wright 
144bd882c8aSJames Wright //------------------------------------------------------------------------------
145bd882c8aSJames Wright // Check if has array of given type
146bd882c8aSJames Wright //------------------------------------------------------------------------------
147bd882c8aSJames Wright static inline int CeedVectorHasArrayOfType_Sycl(const CeedVector vec, CeedMemType mem_type, bool *has_array_of_type) {
148bd882c8aSJames Wright   CeedVector_Sycl *impl;
149bd882c8aSJames Wright 
150dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
151bd882c8aSJames Wright   switch (mem_type) {
152bd882c8aSJames Wright     case CEED_MEM_HOST:
1531c66c397SJeremy L Thompson       *has_array_of_type = impl->h_array_borrowed || impl->h_array_owned;
154bd882c8aSJames Wright       break;
155bd882c8aSJames Wright     case CEED_MEM_DEVICE:
1561c66c397SJeremy L Thompson       *has_array_of_type = impl->d_array_borrowed || impl->d_array_owned;
157bd882c8aSJames Wright       break;
158bd882c8aSJames Wright   }
159bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
160bd882c8aSJames Wright }
161bd882c8aSJames Wright 
162bd882c8aSJames Wright //------------------------------------------------------------------------------
163bd882c8aSJames Wright // Check if has borrowed array of given type
164bd882c8aSJames Wright //------------------------------------------------------------------------------
165bd882c8aSJames Wright static inline int CeedVectorHasBorrowedArrayOfType_Sycl(const CeedVector vec, CeedMemType mem_type, bool *has_borrowed_array_of_type) {
166bd882c8aSJames Wright   CeedVector_Sycl *impl;
167bd882c8aSJames Wright 
168dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
169bd882c8aSJames Wright   switch (mem_type) {
170bd882c8aSJames Wright     case CEED_MEM_HOST:
1711c66c397SJeremy L Thompson       *has_borrowed_array_of_type = impl->h_array_borrowed;
172bd882c8aSJames Wright       break;
173bd882c8aSJames Wright     case CEED_MEM_DEVICE:
1741c66c397SJeremy L Thompson       *has_borrowed_array_of_type = impl->d_array_borrowed;
175bd882c8aSJames Wright       break;
176bd882c8aSJames Wright   }
177bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
178bd882c8aSJames Wright }
179bd882c8aSJames Wright 
180bd882c8aSJames Wright //------------------------------------------------------------------------------
181bd882c8aSJames Wright // Set array from host
182bd882c8aSJames Wright //------------------------------------------------------------------------------
183bd882c8aSJames Wright static int CeedVectorSetArrayHost_Sycl(const CeedVector vec, const CeedCopyMode copy_mode, CeedScalar *array) {
184f59ebe5eSJeremy L Thompson   CeedSize         length;
185bd882c8aSJames Wright   CeedVector_Sycl *impl;
186bd882c8aSJames Wright 
187dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
188f59ebe5eSJeremy L Thompson   CeedCallBackend(CeedVectorGetLength(vec, &length));
189f59ebe5eSJeremy L Thompson 
190f5d1e504SJeremy L Thompson   CeedCallBackend(CeedSetHostCeedScalarArray(array, copy_mode, length, (const CeedScalar **)&impl->h_array_owned,
191f5d1e504SJeremy L Thompson                                              (const CeedScalar **)&impl->h_array_borrowed, (const CeedScalar **)&impl->h_array));
192bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
193bd882c8aSJames Wright }
194bd882c8aSJames Wright 
195bd882c8aSJames Wright //------------------------------------------------------------------------------
196bd882c8aSJames Wright // Set array from device
197bd882c8aSJames Wright //------------------------------------------------------------------------------
198bd882c8aSJames Wright static int CeedVectorSetArrayDevice_Sycl(const CeedVector vec, const CeedCopyMode copy_mode, CeedScalar *array) {
199f59ebe5eSJeremy L Thompson   CeedSize         length;
200bd882c8aSJames Wright   Ceed             ceed;
201bd882c8aSJames Wright   Ceed_Sycl       *data;
202dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
203dd64fc84SJeremy L Thompson 
204dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
205dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
206bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
207f59ebe5eSJeremy L Thompson   CeedCallBackend(CeedVectorGetLength(vec, &length));
208bd882c8aSJames Wright 
209*1f4b1b45SUmesh Unnikrishnan   // Order queue if needed.
210*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
211*1f4b1b45SUmesh Unnikrishnan 
212*1f4b1b45SUmesh Unnikrishnan   if (!data->sycl_queue.is_in_order()) e = {data->sycl_queue.ext_oneapi_submit_barrier()};
213bd882c8aSJames Wright 
214bd882c8aSJames Wright   switch (copy_mode) {
215bd882c8aSJames Wright     case CEED_COPY_VALUES: {
216e588e9b3SJeremy L Thompson       if (!impl->d_array_owned) {
217bd882c8aSJames Wright         CeedCallSycl(ceed, impl->d_array_owned = sycl::malloc_device<CeedScalar>(length, data->sycl_device, data->sycl_context));
218e588e9b3SJeremy L Thompson       }
219bd882c8aSJames Wright       if (array) {
220bd882c8aSJames Wright         // Wait for copy to finish and handle exceptions.
221*1f4b1b45SUmesh Unnikrishnan         CeedCallSycl(ceed, data->sycl_queue.copy<CeedScalar>(array, impl->d_array_owned, length, e).wait_and_throw());
222bd882c8aSJames Wright       }
223f59ebe5eSJeremy L Thompson       impl->d_array_borrowed = NULL;
224f59ebe5eSJeremy L Thompson       impl->d_array          = impl->d_array_owned;
225bd882c8aSJames Wright     } break;
226bd882c8aSJames Wright     case CEED_OWN_POINTER:
227bd882c8aSJames Wright       if (impl->d_array_owned) {
228bd882c8aSJames Wright         // Wait for all work to finish before freeing memory
229bd882c8aSJames Wright         CeedCallSycl(ceed, data->sycl_queue.wait_and_throw());
230bd882c8aSJames Wright         CeedCallSycl(ceed, sycl::free(impl->d_array_owned, data->sycl_context));
231bd882c8aSJames Wright       }
232bd882c8aSJames Wright       impl->d_array_owned    = array;
233bd882c8aSJames Wright       impl->d_array_borrowed = NULL;
234f59ebe5eSJeremy L Thompson       impl->d_array          = impl->d_array_owned;
235bd882c8aSJames Wright       break;
236bd882c8aSJames Wright     case CEED_USE_POINTER:
237bd882c8aSJames Wright       if (impl->d_array_owned) {
238bd882c8aSJames Wright         // Wait for all work to finish before freeing memory
239bd882c8aSJames Wright         CeedCallSycl(ceed, data->sycl_queue.wait_and_throw());
240bd882c8aSJames Wright         CeedCallSycl(ceed, sycl::free(impl->d_array_owned, data->sycl_context));
241bd882c8aSJames Wright       }
242bd882c8aSJames Wright       impl->d_array_owned    = NULL;
243bd882c8aSJames Wright       impl->d_array_borrowed = array;
244f59ebe5eSJeremy L Thompson       impl->d_array          = impl->d_array_borrowed;
245bd882c8aSJames Wright       break;
246bd882c8aSJames Wright   }
247bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
248bd882c8aSJames Wright }
249bd882c8aSJames Wright 
250bd882c8aSJames Wright //------------------------------------------------------------------------------
251bd882c8aSJames Wright // Set the array used by a vector,
252bd882c8aSJames Wright //   freeing any previously allocated array if applicable
253bd882c8aSJames Wright //------------------------------------------------------------------------------
254bd882c8aSJames Wright static int CeedVectorSetArray_Sycl(const CeedVector vec, const CeedMemType mem_type, const CeedCopyMode copy_mode, CeedScalar *array) {
255bd882c8aSJames Wright   CeedVector_Sycl *impl;
256dd64fc84SJeremy L Thompson 
257bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(vec, &impl));
258bd882c8aSJames Wright 
259bd882c8aSJames Wright   CeedCallBackend(CeedVectorSetAllInvalid_Sycl(vec));
260bd882c8aSJames Wright   switch (mem_type) {
261bd882c8aSJames Wright     case CEED_MEM_HOST:
262bd882c8aSJames Wright       return CeedVectorSetArrayHost_Sycl(vec, copy_mode, array);
263bd882c8aSJames Wright     case CEED_MEM_DEVICE:
264bd882c8aSJames Wright       return CeedVectorSetArrayDevice_Sycl(vec, copy_mode, array);
265bd882c8aSJames Wright   }
266bd882c8aSJames Wright   return CEED_ERROR_UNSUPPORTED;
267bd882c8aSJames Wright }
268bd882c8aSJames Wright 
269bd882c8aSJames Wright //------------------------------------------------------------------------------
270bd882c8aSJames Wright // Set host array to value
271bd882c8aSJames Wright //------------------------------------------------------------------------------
2726ca0f394SUmesh Unnikrishnan static int CeedHostSetValue_Sycl(CeedScalar *h_array, CeedSize length, CeedScalar val) {
2736ca0f394SUmesh Unnikrishnan   for (CeedSize i = 0; i < length; i++) h_array[i] = val;
274bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
275bd882c8aSJames Wright }
276bd882c8aSJames Wright 
277bd882c8aSJames Wright //------------------------------------------------------------------------------
278bd882c8aSJames Wright // Set device array to value
279bd882c8aSJames Wright //------------------------------------------------------------------------------
2806ca0f394SUmesh Unnikrishnan static int CeedDeviceSetValue_Sycl(sycl::queue &sycl_queue, CeedScalar *d_array, CeedSize length, CeedScalar val) {
281*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
282*1f4b1b45SUmesh Unnikrishnan 
283*1f4b1b45SUmesh Unnikrishnan   if (!sycl_queue.is_in_order()) e = {sycl_queue.ext_oneapi_submit_barrier()};
284*1f4b1b45SUmesh Unnikrishnan   sycl_queue.fill(d_array, val, length, e);
285bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
286bd882c8aSJames Wright }
287bd882c8aSJames Wright 
288bd882c8aSJames Wright //------------------------------------------------------------------------------
289bd882c8aSJames Wright // Set a vector to a value,
290bd882c8aSJames Wright //------------------------------------------------------------------------------
291bd882c8aSJames Wright static int CeedVectorSetValue_Sycl(CeedVector vec, CeedScalar val) {
292bd882c8aSJames Wright   Ceed             ceed;
293bd882c8aSJames Wright   Ceed_Sycl       *data;
294dd64fc84SJeremy L Thompson   CeedSize         length;
295dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
296dd64fc84SJeremy L Thompson 
297dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
298dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
299dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetLength(vec, &length));
300bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
301bd882c8aSJames Wright 
302bd882c8aSJames Wright   // Set value for synced device/host array
303bd882c8aSJames Wright   if (!impl->d_array && !impl->h_array) {
304bd882c8aSJames Wright     if (impl->d_array_borrowed) {
305bd882c8aSJames Wright       impl->d_array = impl->d_array_borrowed;
306bd882c8aSJames Wright     } else if (impl->h_array_borrowed) {
307bd882c8aSJames Wright       impl->h_array = impl->h_array_borrowed;
308bd882c8aSJames Wright     } else if (impl->d_array_owned) {
309bd882c8aSJames Wright       impl->d_array = impl->d_array_owned;
310bd882c8aSJames Wright     } else if (impl->h_array_owned) {
311bd882c8aSJames Wright       impl->h_array = impl->h_array_owned;
312bd882c8aSJames Wright     } else {
313bd882c8aSJames Wright       CeedCallBackend(CeedVectorSetArray(vec, CEED_MEM_DEVICE, CEED_COPY_VALUES, NULL));
314bd882c8aSJames Wright     }
315bd882c8aSJames Wright   }
316bd882c8aSJames Wright   if (impl->d_array) {
317bd882c8aSJames Wright     CeedCallBackend(CeedDeviceSetValue_Sycl(data->sycl_queue, impl->d_array, length, val));
318bd882c8aSJames Wright     impl->h_array = NULL;
319bd882c8aSJames Wright   }
320bd882c8aSJames Wright   if (impl->h_array) {
321bd882c8aSJames Wright     CeedCallBackend(CeedHostSetValue_Sycl(impl->h_array, length, val));
322bd882c8aSJames Wright     impl->d_array = NULL;
323bd882c8aSJames Wright   }
324bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
325bd882c8aSJames Wright }
326bd882c8aSJames Wright 
327bd882c8aSJames Wright //------------------------------------------------------------------------------
328bd882c8aSJames Wright // Vector Take Array
329bd882c8aSJames Wright //------------------------------------------------------------------------------
330bd882c8aSJames Wright static int CeedVectorTakeArray_Sycl(CeedVector vec, CeedMemType mem_type, CeedScalar **array) {
331bd882c8aSJames Wright   Ceed             ceed;
332bd882c8aSJames Wright   Ceed_Sycl       *data;
333dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
334dd64fc84SJeremy L Thompson 
335dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
336dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
337bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
338bd882c8aSJames Wright 
339*1f4b1b45SUmesh Unnikrishnan   // Order queue if needed
340*1f4b1b45SUmesh Unnikrishnan   if (!data->sycl_queue.is_in_order()) data->sycl_queue.ext_oneapi_submit_barrier();
341bd882c8aSJames Wright 
342bd882c8aSJames Wright   // Sync array to requested mem_type
343bd882c8aSJames Wright   CeedCallBackend(CeedVectorSyncArray(vec, mem_type));
344bd882c8aSJames Wright 
345bd882c8aSJames Wright   // Update pointer
346bd882c8aSJames Wright   switch (mem_type) {
347bd882c8aSJames Wright     case CEED_MEM_HOST:
348bd882c8aSJames Wright       (*array)               = impl->h_array_borrowed;
349bd882c8aSJames Wright       impl->h_array_borrowed = NULL;
350bd882c8aSJames Wright       impl->h_array          = NULL;
351bd882c8aSJames Wright       break;
352bd882c8aSJames Wright     case CEED_MEM_DEVICE:
353bd882c8aSJames Wright       (*array)               = impl->d_array_borrowed;
354bd882c8aSJames Wright       impl->d_array_borrowed = NULL;
355bd882c8aSJames Wright       impl->d_array          = NULL;
356bd882c8aSJames Wright       break;
357bd882c8aSJames Wright   }
358bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
359bd882c8aSJames Wright }
360bd882c8aSJames Wright 
361bd882c8aSJames Wright //------------------------------------------------------------------------------
// Core logic for array synchronization for GetArray.
363bd882c8aSJames Wright //   If a different memory type is most up to date, this will perform a copy
364bd882c8aSJames Wright //------------------------------------------------------------------------------
365bd882c8aSJames Wright static int CeedVectorGetArrayCore_Sycl(const CeedVector vec, const CeedMemType mem_type, CeedScalar **array) {
366bd882c8aSJames Wright   CeedVector_Sycl *impl;
367dd64fc84SJeremy L Thompson 
368bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(vec, &impl));
369bd882c8aSJames Wright 
370bd882c8aSJames Wright   // Sync array to requested mem_type
371bd882c8aSJames Wright   CeedCallBackend(CeedVectorSyncArray(vec, mem_type));
372bd882c8aSJames Wright 
373bd882c8aSJames Wright   // Update pointer
374bd882c8aSJames Wright   switch (mem_type) {
375bd882c8aSJames Wright     case CEED_MEM_HOST:
376bd882c8aSJames Wright       *array = impl->h_array;
377bd882c8aSJames Wright       break;
378bd882c8aSJames Wright     case CEED_MEM_DEVICE:
379bd882c8aSJames Wright       *array = impl->d_array;
380bd882c8aSJames Wright       break;
381bd882c8aSJames Wright   }
382bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
383bd882c8aSJames Wright }
384ff1e7120SSebastian Grimberg 
385bd882c8aSJames Wright //------------------------------------------------------------------------------
386bd882c8aSJames Wright // Get read-only access to a vector via the specified mem_type
387bd882c8aSJames Wright //------------------------------------------------------------------------------
388bd882c8aSJames Wright static int CeedVectorGetArrayRead_Sycl(const CeedVector vec, const CeedMemType mem_type, const CeedScalar **array) {
389bd882c8aSJames Wright   return CeedVectorGetArrayCore_Sycl(vec, mem_type, (CeedScalar **)array);
390bd882c8aSJames Wright }
391bd882c8aSJames Wright 
392bd882c8aSJames Wright //------------------------------------------------------------------------------
393bd882c8aSJames Wright // Get read/write access to a vector via the specified mem_type
394bd882c8aSJames Wright //------------------------------------------------------------------------------
395bd882c8aSJames Wright static int CeedVectorGetArray_Sycl(const CeedVector vec, const CeedMemType mem_type, CeedScalar **array) {
396bd882c8aSJames Wright   CeedVector_Sycl *impl;
397dd64fc84SJeremy L Thompson 
398bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(vec, &impl));
399bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetArrayCore_Sycl(vec, mem_type, array));
400bd882c8aSJames Wright   CeedCallBackend(CeedVectorSetAllInvalid_Sycl(vec));
401bd882c8aSJames Wright   switch (mem_type) {
402bd882c8aSJames Wright     case CEED_MEM_HOST:
403bd882c8aSJames Wright       impl->h_array = *array;
404bd882c8aSJames Wright       break;
405bd882c8aSJames Wright     case CEED_MEM_DEVICE:
406bd882c8aSJames Wright       impl->d_array = *array;
407bd882c8aSJames Wright       break;
408bd882c8aSJames Wright   }
409bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
410bd882c8aSJames Wright }
411bd882c8aSJames Wright 
412bd882c8aSJames Wright //------------------------------------------------------------------------------
413bd882c8aSJames Wright // Get write access to a vector via the specified mem_type
414bd882c8aSJames Wright //------------------------------------------------------------------------------
415bd882c8aSJames Wright static int CeedVectorGetArrayWrite_Sycl(const CeedVector vec, const CeedMemType mem_type, CeedScalar **array) {
416bd882c8aSJames Wright   bool             has_array_of_type = true;
417dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
418dd64fc84SJeremy L Thompson 
419dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
420bd882c8aSJames Wright   CeedCallBackend(CeedVectorHasArrayOfType_Sycl(vec, mem_type, &has_array_of_type));
421bd882c8aSJames Wright   if (!has_array_of_type) {
422bd882c8aSJames Wright     // Allocate if array is not yet allocated
423bd882c8aSJames Wright     CeedCallBackend(CeedVectorSetArray(vec, mem_type, CEED_COPY_VALUES, NULL));
424bd882c8aSJames Wright   } else {
425bd882c8aSJames Wright     // Select dirty array
426bd882c8aSJames Wright     switch (mem_type) {
427bd882c8aSJames Wright       case CEED_MEM_HOST:
428bd882c8aSJames Wright         if (impl->h_array_borrowed) impl->h_array = impl->h_array_borrowed;
429bd882c8aSJames Wright         else impl->h_array = impl->h_array_owned;
430bd882c8aSJames Wright         break;
431bd882c8aSJames Wright       case CEED_MEM_DEVICE:
432bd882c8aSJames Wright         if (impl->d_array_borrowed) impl->d_array = impl->d_array_borrowed;
433bd882c8aSJames Wright         else impl->d_array = impl->d_array_owned;
434bd882c8aSJames Wright     }
435bd882c8aSJames Wright   }
436bd882c8aSJames Wright   return CeedVectorGetArray_Sycl(vec, mem_type, array);
437bd882c8aSJames Wright }
438bd882c8aSJames Wright 
439bd882c8aSJames Wright //------------------------------------------------------------------------------
440bd882c8aSJames Wright // Get the norm of a CeedVector
441bd882c8aSJames Wright //------------------------------------------------------------------------------
442bd882c8aSJames Wright static int CeedVectorNorm_Sycl(CeedVector vec, CeedNormType type, CeedScalar *norm) {
443bd882c8aSJames Wright   Ceed              ceed;
444bd882c8aSJames Wright   Ceed_Sycl        *data;
445dd64fc84SJeremy L Thompson   CeedSize          length;
446dd64fc84SJeremy L Thompson   const CeedScalar *d_array;
447dd64fc84SJeremy L Thompson   CeedVector_Sycl  *impl;
448dd64fc84SJeremy L Thompson 
449dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
450dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
451dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetLength(vec, &length));
452bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
453bd882c8aSJames Wright 
454bd882c8aSJames Wright   // Compute norm
455bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetArrayRead(vec, CEED_MEM_DEVICE, &d_array));
456*1f4b1b45SUmesh Unnikrishnan 
457*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
458*1f4b1b45SUmesh Unnikrishnan 
459*1f4b1b45SUmesh Unnikrishnan   if (!data->sycl_queue.is_in_order()) e = {data->sycl_queue.ext_oneapi_submit_barrier()};
460*1f4b1b45SUmesh Unnikrishnan 
461bd882c8aSJames Wright   switch (type) {
462bd882c8aSJames Wright     case CEED_NORM_1: {
463bd882c8aSJames Wright       // Order queue
464bd882c8aSJames Wright       auto sumReduction = sycl::reduction(impl->reduction_norm, sycl::plus<>(), {sycl::property::reduction::initialize_to_identity{}});
465*1f4b1b45SUmesh Unnikrishnan       data->sycl_queue.parallel_for(length, e, sumReduction, [=](sycl::id<1> i, auto &sum) { sum += abs(d_array[i]); }).wait_and_throw();
466bd882c8aSJames Wright     } break;
467bd882c8aSJames Wright     case CEED_NORM_2: {
468bd882c8aSJames Wright       // Order queue
469bd882c8aSJames Wright       auto sumReduction = sycl::reduction(impl->reduction_norm, sycl::plus<>(), {sycl::property::reduction::initialize_to_identity{}});
470*1f4b1b45SUmesh Unnikrishnan       data->sycl_queue.parallel_for(length, e, sumReduction, [=](sycl::id<1> i, auto &sum) { sum += (d_array[i] * d_array[i]); }).wait_and_throw();
471bd882c8aSJames Wright     } break;
472bd882c8aSJames Wright     case CEED_NORM_MAX: {
473bd882c8aSJames Wright       // Order queue
474bd882c8aSJames Wright       auto maxReduction = sycl::reduction(impl->reduction_norm, sycl::maximum<>(), {sycl::property::reduction::initialize_to_identity{}});
475*1f4b1b45SUmesh Unnikrishnan       data->sycl_queue.parallel_for(length, e, maxReduction, [=](sycl::id<1> i, auto &max) { max.combine(abs(d_array[i])); }).wait_and_throw();
476bd882c8aSJames Wright     } break;
477bd882c8aSJames Wright   }
478bd882c8aSJames Wright   // L2 norm - square root over reduced value
479bd882c8aSJames Wright   if (type == CEED_NORM_2) *norm = sqrt(*impl->reduction_norm);
480bd882c8aSJames Wright   else *norm = *impl->reduction_norm;
481bd882c8aSJames Wright   CeedCallBackend(CeedVectorRestoreArrayRead(vec, &d_array));
482bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
483bd882c8aSJames Wright }
484bd882c8aSJames Wright 
485bd882c8aSJames Wright //------------------------------------------------------------------------------
486bd882c8aSJames Wright // Take reciprocal of a vector on host
487bd882c8aSJames Wright //------------------------------------------------------------------------------
4886ca0f394SUmesh Unnikrishnan static int CeedHostReciprocal_Sycl(CeedScalar *h_array, CeedSize length) {
4896ca0f394SUmesh Unnikrishnan   for (CeedSize i = 0; i < length; i++) {
490bd882c8aSJames Wright     if (std::fabs(h_array[i]) > CEED_EPSILON) h_array[i] = 1. / h_array[i];
491bd882c8aSJames Wright   }
492bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
493bd882c8aSJames Wright }
494bd882c8aSJames Wright 
495bd882c8aSJames Wright //------------------------------------------------------------------------------
496bd882c8aSJames Wright // Take reciprocal of a vector on device
497bd882c8aSJames Wright //------------------------------------------------------------------------------
4986ca0f394SUmesh Unnikrishnan static int CeedDeviceReciprocal_Sycl(sycl::queue &sycl_queue, CeedScalar *d_array, CeedSize length) {
499*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
500*1f4b1b45SUmesh Unnikrishnan 
501*1f4b1b45SUmesh Unnikrishnan   if (!sycl_queue.is_in_order()) e = {sycl_queue.ext_oneapi_submit_barrier()};
502*1f4b1b45SUmesh Unnikrishnan   sycl_queue.parallel_for(length, e, [=](sycl::id<1> i) {
503bd882c8aSJames Wright     if (std::fabs(d_array[i]) > CEED_EPSILON) d_array[i] = 1. / d_array[i];
504bd882c8aSJames Wright   });
505bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
506bd882c8aSJames Wright }
507bd882c8aSJames Wright 
508bd882c8aSJames Wright //------------------------------------------------------------------------------
509bd882c8aSJames Wright // Take reciprocal of a vector
510bd882c8aSJames Wright //------------------------------------------------------------------------------
511bd882c8aSJames Wright static int CeedVectorReciprocal_Sycl(CeedVector vec) {
512bd882c8aSJames Wright   Ceed             ceed;
513bd882c8aSJames Wright   Ceed_Sycl       *data;
514dd64fc84SJeremy L Thompson   CeedSize         length;
515dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
516dd64fc84SJeremy L Thompson 
517dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
518dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
519dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetLength(vec, &length));
520bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
521bd882c8aSJames Wright 
522bd882c8aSJames Wright   // Set value for synced device/host array
523bd882c8aSJames Wright   if (impl->d_array) CeedCallBackend(CeedDeviceReciprocal_Sycl(data->sycl_queue, impl->d_array, length));
524bd882c8aSJames Wright   if (impl->h_array) CeedCallBackend(CeedHostReciprocal_Sycl(impl->h_array, length));
525bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
526bd882c8aSJames Wright }
527bd882c8aSJames Wright 
528bd882c8aSJames Wright //------------------------------------------------------------------------------
529bd882c8aSJames Wright // Compute x = alpha x on the host
530bd882c8aSJames Wright //------------------------------------------------------------------------------
5316ca0f394SUmesh Unnikrishnan static int CeedHostScale_Sycl(CeedScalar *x_array, CeedScalar alpha, CeedSize length) {
5326ca0f394SUmesh Unnikrishnan   for (CeedSize i = 0; i < length; i++) x_array[i] *= alpha;
533bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
534bd882c8aSJames Wright }
535bd882c8aSJames Wright 
536bd882c8aSJames Wright //------------------------------------------------------------------------------
537bd882c8aSJames Wright // Compute x = alpha x on device
538bd882c8aSJames Wright //------------------------------------------------------------------------------
5396ca0f394SUmesh Unnikrishnan static int CeedDeviceScale_Sycl(sycl::queue &sycl_queue, CeedScalar *x_array, CeedScalar alpha, CeedSize length) {
540*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
541*1f4b1b45SUmesh Unnikrishnan 
542*1f4b1b45SUmesh Unnikrishnan   if (!sycl_queue.is_in_order()) e = {sycl_queue.ext_oneapi_submit_barrier()};
543*1f4b1b45SUmesh Unnikrishnan   sycl_queue.parallel_for(length, e, [=](sycl::id<1> i) { x_array[i] *= alpha; });
544bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
545bd882c8aSJames Wright }
546bd882c8aSJames Wright 
547bd882c8aSJames Wright //------------------------------------------------------------------------------
548bd882c8aSJames Wright // Compute x = alpha x
549bd882c8aSJames Wright //------------------------------------------------------------------------------
550bd882c8aSJames Wright static int CeedVectorScale_Sycl(CeedVector x, CeedScalar alpha) {
551bd882c8aSJames Wright   Ceed             ceed;
552bd882c8aSJames Wright   Ceed_Sycl       *data;
553dd64fc84SJeremy L Thompson   CeedSize         length;
554dd64fc84SJeremy L Thompson   CeedVector_Sycl *x_impl;
555dd64fc84SJeremy L Thompson 
556dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(x, &ceed));
557dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(x, &x_impl));
558dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetLength(x, &length));
559bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
560bd882c8aSJames Wright 
561bd882c8aSJames Wright   // Set value for synced device/host array
562bd882c8aSJames Wright   if (x_impl->d_array) CeedCallBackend(CeedDeviceScale_Sycl(data->sycl_queue, x_impl->d_array, alpha, length));
563bd882c8aSJames Wright   if (x_impl->h_array) CeedCallBackend(CeedHostScale_Sycl(x_impl->h_array, alpha, length));
564bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
565bd882c8aSJames Wright }
566bd882c8aSJames Wright 
567bd882c8aSJames Wright //------------------------------------------------------------------------------
568bd882c8aSJames Wright // Compute y = alpha x + y on the host
569bd882c8aSJames Wright //------------------------------------------------------------------------------
5706ca0f394SUmesh Unnikrishnan static int CeedHostAXPY_Sycl(CeedScalar *y_array, CeedScalar alpha, CeedScalar *x_array, CeedSize length) {
5716ca0f394SUmesh Unnikrishnan   for (CeedSize i = 0; i < length; i++) y_array[i] += alpha * x_array[i];
572bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
573bd882c8aSJames Wright }
574bd882c8aSJames Wright 
575bd882c8aSJames Wright //------------------------------------------------------------------------------
576bd882c8aSJames Wright // Compute y = alpha x + y on device
577bd882c8aSJames Wright //------------------------------------------------------------------------------
5786ca0f394SUmesh Unnikrishnan static int CeedDeviceAXPY_Sycl(sycl::queue &sycl_queue, CeedScalar *y_array, CeedScalar alpha, CeedScalar *x_array, CeedSize length) {
579*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
580*1f4b1b45SUmesh Unnikrishnan 
581*1f4b1b45SUmesh Unnikrishnan   if (!sycl_queue.is_in_order()) e = {sycl_queue.ext_oneapi_submit_barrier()};
582*1f4b1b45SUmesh Unnikrishnan   sycl_queue.parallel_for(length, e, [=](sycl::id<1> i) { y_array[i] += alpha * x_array[i]; });
583bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
584bd882c8aSJames Wright }
585bd882c8aSJames Wright 
586bd882c8aSJames Wright //------------------------------------------------------------------------------
587bd882c8aSJames Wright // Compute y = alpha x + y
588bd882c8aSJames Wright //------------------------------------------------------------------------------
589bd882c8aSJames Wright static int CeedVectorAXPY_Sycl(CeedVector y, CeedScalar alpha, CeedVector x) {
590bd882c8aSJames Wright   Ceed             ceed;
591dd64fc84SJeremy L Thompson   Ceed_Sycl       *data;
592dd64fc84SJeremy L Thompson   CeedSize         length;
593bd882c8aSJames Wright   CeedVector_Sycl *y_impl, *x_impl;
594dd64fc84SJeremy L Thompson 
595dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(y, &ceed));
596bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(y, &y_impl));
597bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(x, &x_impl));
598bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetLength(y, &length));
599bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
600bd882c8aSJames Wright 
601bd882c8aSJames Wright   // Set value for synced device/host array
602bd882c8aSJames Wright   if (y_impl->d_array) {
603bd882c8aSJames Wright     CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_DEVICE));
604bd882c8aSJames Wright     CeedCallBackend(CeedDeviceAXPY_Sycl(data->sycl_queue, y_impl->d_array, alpha, x_impl->d_array, length));
605bd882c8aSJames Wright   }
606bd882c8aSJames Wright   if (y_impl->h_array) {
607bd882c8aSJames Wright     CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_HOST));
608bd882c8aSJames Wright     CeedCallBackend(CeedHostAXPY_Sycl(y_impl->h_array, alpha, x_impl->h_array, length));
609bd882c8aSJames Wright   }
610bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
611bd882c8aSJames Wright }
612bd882c8aSJames Wright 
613bd882c8aSJames Wright //------------------------------------------------------------------------------
614bd882c8aSJames Wright // Compute the pointwise multiplication w = x .* y on the host
615bd882c8aSJames Wright //------------------------------------------------------------------------------
6166ca0f394SUmesh Unnikrishnan static int CeedHostPointwiseMult_Sycl(CeedScalar *w_array, CeedScalar *x_array, CeedScalar *y_array, CeedSize length) {
6176ca0f394SUmesh Unnikrishnan   for (CeedSize i = 0; i < length; i++) w_array[i] = x_array[i] * y_array[i];
618bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
619bd882c8aSJames Wright }
620bd882c8aSJames Wright 
621bd882c8aSJames Wright //------------------------------------------------------------------------------
622bd882c8aSJames Wright // Compute the pointwise multiplication w = x .* y on device (impl in .cu file)
623bd882c8aSJames Wright //------------------------------------------------------------------------------
6246ca0f394SUmesh Unnikrishnan static int CeedDevicePointwiseMult_Sycl(sycl::queue &sycl_queue, CeedScalar *w_array, CeedScalar *x_array, CeedScalar *y_array, CeedSize length) {
625*1f4b1b45SUmesh Unnikrishnan   std::vector<sycl::event> e;
626*1f4b1b45SUmesh Unnikrishnan 
627*1f4b1b45SUmesh Unnikrishnan   if (!sycl_queue.is_in_order()) e = {sycl_queue.ext_oneapi_submit_barrier()};
628*1f4b1b45SUmesh Unnikrishnan   sycl_queue.parallel_for(length, e, [=](sycl::id<1> i) { w_array[i] = x_array[i] * y_array[i]; });
629bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
630bd882c8aSJames Wright }
631bd882c8aSJames Wright 
632bd882c8aSJames Wright //------------------------------------------------------------------------------
633bd882c8aSJames Wright // Compute the pointwise multiplication w = x .* y
634bd882c8aSJames Wright //------------------------------------------------------------------------------
635bd882c8aSJames Wright static int CeedVectorPointwiseMult_Sycl(CeedVector w, CeedVector x, CeedVector y) {
636bd882c8aSJames Wright   Ceed             ceed;
637dd64fc84SJeremy L Thompson   Ceed_Sycl       *data;
638dd64fc84SJeremy L Thompson   CeedSize         length;
639bd882c8aSJames Wright   CeedVector_Sycl *w_impl, *x_impl, *y_impl;
640dd64fc84SJeremy L Thompson 
641dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(w, &ceed));
642bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(w, &w_impl));
643bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(x, &x_impl));
644bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetData(y, &y_impl));
645bd882c8aSJames Wright   CeedCallBackend(CeedVectorGetLength(w, &length));
646bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
647bd882c8aSJames Wright 
648bd882c8aSJames Wright   // Set value for synced device/host array
649bd882c8aSJames Wright   if (!w_impl->d_array && !w_impl->h_array) {
650bd882c8aSJames Wright     CeedCallBackend(CeedVectorSetValue(w, 0.0));
651bd882c8aSJames Wright   }
652bd882c8aSJames Wright   if (w_impl->d_array) {
653bd882c8aSJames Wright     CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_DEVICE));
654bd882c8aSJames Wright     CeedCallBackend(CeedVectorSyncArray(y, CEED_MEM_DEVICE));
655bd882c8aSJames Wright     CeedCallBackend(CeedDevicePointwiseMult_Sycl(data->sycl_queue, w_impl->d_array, x_impl->d_array, y_impl->d_array, length));
656bd882c8aSJames Wright   }
657bd882c8aSJames Wright   if (w_impl->h_array) {
658bd882c8aSJames Wright     CeedCallBackend(CeedVectorSyncArray(x, CEED_MEM_HOST));
659bd882c8aSJames Wright     CeedCallBackend(CeedVectorSyncArray(y, CEED_MEM_HOST));
660bd882c8aSJames Wright     CeedCallBackend(CeedHostPointwiseMult_Sycl(w_impl->h_array, x_impl->h_array, y_impl->h_array, length));
661bd882c8aSJames Wright   }
662bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
663bd882c8aSJames Wright }
664bd882c8aSJames Wright 
665bd882c8aSJames Wright //------------------------------------------------------------------------------
666bd882c8aSJames Wright // Destroy the vector
667bd882c8aSJames Wright //------------------------------------------------------------------------------
668bd882c8aSJames Wright static int CeedVectorDestroy_Sycl(const CeedVector vec) {
669bd882c8aSJames Wright   Ceed             ceed;
670bd882c8aSJames Wright   Ceed_Sycl       *data;
671dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
672dd64fc84SJeremy L Thompson 
673dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
674dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetData(vec, &impl));
675bd882c8aSJames Wright   CeedCallBackend(CeedGetData(ceed, &data));
676bd882c8aSJames Wright 
677bd882c8aSJames Wright   // Wait for all work to finish before freeing memory
678bd882c8aSJames Wright   CeedCallSycl(ceed, data->sycl_queue.wait_and_throw());
679bd882c8aSJames Wright   CeedCallSycl(ceed, sycl::free(impl->d_array_owned, data->sycl_context));
680bd882c8aSJames Wright   CeedCallSycl(ceed, sycl::free(impl->reduction_norm, data->sycl_context));
681bd882c8aSJames Wright 
682bd882c8aSJames Wright   CeedCallBackend(CeedFree(&impl->h_array_owned));
683bd882c8aSJames Wright   CeedCallBackend(CeedFree(&impl));
684bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
685bd882c8aSJames Wright }
686bd882c8aSJames Wright 
687bd882c8aSJames Wright //------------------------------------------------------------------------------
688bd882c8aSJames Wright // Create a vector of the specified length (does not allocate memory)
689bd882c8aSJames Wright //------------------------------------------------------------------------------
690bd882c8aSJames Wright int CeedVectorCreate_Sycl(CeedSize n, CeedVector vec) {
691bd882c8aSJames Wright   Ceed             ceed;
692bd882c8aSJames Wright   Ceed_Sycl       *data;
693dd64fc84SJeremy L Thompson   CeedVector_Sycl *impl;
694bd882c8aSJames Wright 
695dd64fc84SJeremy L Thompson   CeedCallBackend(CeedVectorGetCeed(vec, &ceed));
696dd64fc84SJeremy L Thompson   CeedCallBackend(CeedGetData(ceed, &data));
697bd882c8aSJames Wright   CeedCallBackend(CeedCalloc(1, &impl));
698bd882c8aSJames Wright   CeedCallSycl(ceed, impl->reduction_norm = sycl::malloc_host<CeedScalar>(1, data->sycl_context));
699bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "HasValidArray", CeedVectorHasValidArray_Sycl));
700bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "HasBorrowedArrayOfType", CeedVectorHasBorrowedArrayOfType_Sycl));
701bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "SetArray", CeedVectorSetArray_Sycl));
702bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "TakeArray", CeedVectorTakeArray_Sycl));
703bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "SetValue", CeedVectorSetValue_Sycl));
704bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "SyncArray", CeedVectorSyncArray_Sycl));
705bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "GetArray", CeedVectorGetArray_Sycl));
706bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "GetArrayRead", CeedVectorGetArrayRead_Sycl));
707bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "GetArrayWrite", CeedVectorGetArrayWrite_Sycl));
708bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "Norm", CeedVectorNorm_Sycl));
709bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "Reciprocal", CeedVectorReciprocal_Sycl));
710bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "AXPY", CeedVectorAXPY_Sycl));
711bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "Scale", CeedVectorScale_Sycl));
712bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "PointwiseMult", CeedVectorPointwiseMult_Sycl));
713bd882c8aSJames Wright   CeedCallBackend(CeedSetBackendFunctionCpp(ceed, "Vector", vec, "Destroy", CeedVectorDestroy_Sycl));
714bd882c8aSJames Wright   CeedCallBackend(CeedVectorSetData(vec, impl));
715bd882c8aSJames Wright   return CEED_ERROR_SUCCESS;
716bd882c8aSJames Wright }
717