Lines Matching refs:elem_size
21 … const CeedInt elem_size, CeedSize v_offset, const CeedScalar *__restrict__ uu, in CeedElemRestrictionApplyStridedNoTranspose_Ref_Core() argument
32 for (CeedSize n = 0; n < elem_size; n++) { in CeedElemRestrictionApplyStridedNoTranspose_Ref_Core()
34 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyStridedNoTranspose_Ref_Core()
35 … uu[n + k * elem_size + CeedIntMin(e + j, num_elem - 1) * elem_size * (CeedSize)num_comp]; in CeedElemRestrictionApplyStridedNoTranspose_Ref_Core()
47 for (CeedSize n = 0; n < elem_size; n++) { in CeedElemRestrictionApplyStridedNoTranspose_Ref_Core()
49 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyStridedNoTranspose_Ref_Core()
61 … const CeedInt num_elem, const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyOffsetNoTranspose_Ref_Core() argument
69 CeedPragmaSIMD for (CeedSize i = 0; i < elem_size * block_size; i++) { in CeedElemRestrictionApplyOffsetNoTranspose_Ref_Core()
70 …vv[elem_size * (k * block_size + e * num_comp) + i - v_offset] = uu[impl->offsets[i + e * elem_siz… in CeedElemRestrictionApplyOffsetNoTranspose_Ref_Core()
79 … const CeedInt num_elem, const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyOrientedNoTranspose_Ref_Core() argument
87 CeedPragmaSIMD for (CeedSize i = 0; i < elem_size * block_size; i++) { in CeedElemRestrictionApplyOrientedNoTranspose_Ref_Core()
88 vv[elem_size * (k * block_size + e * num_comp) + i - v_offset] = in CeedElemRestrictionApplyOrientedNoTranspose_Ref_Core()
89 …uu[impl->offsets[i + e * elem_size] + k * comp_stride] * (impl->orients[i + e * elem_size] ? -1.0 … in CeedElemRestrictionApplyOrientedNoTranspose_Ref_Core()
98 … const CeedInt num_elem, const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core() argument
109 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
110 uu[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
111 impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
112 uu[impl->offsets[j + (n + 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
113 impl->curl_orients[j + (3 * n + 2) * block_size + e * 3 * elem_size]; in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
115 for (n = 1; n < elem_size - 1; n++) { in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
117 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
118 uu[impl->offsets[j + (n - 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
119 impl->curl_orients[j + (3 * n + 0) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
120 uu[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
121 impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
122 uu[impl->offsets[j + (n + 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
123 impl->curl_orients[j + (3 * n + 2) * block_size + e * 3 * elem_size]; in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
127 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
128 uu[impl->offsets[j + (n - 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
129 impl->curl_orients[j + (3 * n + 0) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
130 uu[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
131 impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]; in CeedElemRestrictionApplyCurlOrientedNoTranspose_Ref_Core()
141 … const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core() argument
152 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
153 uu[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
154 abs(impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
155 uu[impl->offsets[j + (n + 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
156 abs(impl->curl_orients[j + (3 * n + 2) * block_size + e * 3 * elem_size]); in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
158 for (n = 1; n < elem_size - 1; n++) { in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
160 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
161 uu[impl->offsets[j + (n - 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
162 abs(impl->curl_orients[j + (3 * n + 0) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
163 uu[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
164 abs(impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
165 uu[impl->offsets[j + (n + 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
166 abs(impl->curl_orients[j + (3 * n + 2) * block_size + e * 3 * elem_size]); in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
170 vv[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] = in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
171 uu[impl->offsets[j + (n - 1) * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
172 abs(impl->curl_orients[j + (3 * n + 0) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
173 uu[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] * in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
174 abs(impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]); in CeedElemRestrictionApplyCurlOrientedUnsignedNoTranspose_Ref_Core()
183 … const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyStridedTranspose_Ref_Core() argument
194 for (CeedSize n = 0; n < elem_size; n++) { in CeedElemRestrictionApplyStridedTranspose_Ref_Core()
196 …vv[n + k * elem_size + (e + j) * elem_size * num_comp] += uu[e * elem_size * num_comp + (k * elem_… in CeedElemRestrictionApplyStridedTranspose_Ref_Core()
208 for (CeedSize n = 0; n < elem_size; n++) { in CeedElemRestrictionApplyStridedTranspose_Ref_Core()
211 uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset]; in CeedElemRestrictionApplyStridedTranspose_Ref_Core()
222 … const CeedInt num_elem, const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyOffsetTranspose_Ref_Core() argument
230 for (CeedSize i = 0; i < elem_size * block_size; i += block_size) { in CeedElemRestrictionApplyOffsetTranspose_Ref_Core()
235 vv_loc = uu[elem_size * (k * block_size + e * num_comp) + j - v_offset]; in CeedElemRestrictionApplyOffsetTranspose_Ref_Core()
236 CeedPragmaAtomic vv[impl->offsets[j + e * elem_size] + k * comp_stride] += vv_loc; in CeedElemRestrictionApplyOffsetTranspose_Ref_Core()
246 … const CeedInt num_elem, const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyOrientedTranspose_Ref_Core() argument
254 for (CeedSize i = 0; i < elem_size * block_size; i += block_size) { in CeedElemRestrictionApplyOrientedTranspose_Ref_Core()
259 …vv_loc = uu[elem_size * (k * block_size + e * num_comp) + j - v_offset] * (impl->orients[j + e * e… in CeedElemRestrictionApplyOrientedTranspose_Ref_Core()
260 CeedPragmaAtomic vv[impl->offsets[j + e * elem_size] + k * comp_stride] += vv_loc; in CeedElemRestrictionApplyOrientedTranspose_Ref_Core()
270 … const CeedInt num_elem, const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core() argument
284 vv_loc[j] = uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
285 impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
286 … uu[e * elem_size * num_comp + (k * elem_size + n + 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
287 impl->curl_orients[j + (3 * n + 3) * block_size + e * 3 * elem_size]; in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
290 …CeedPragmaAtomic vv[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] += vv_loc… in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
292 for (n = 1; n < elem_size - 1; n++) { in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
294 … vv_loc[j] = uu[e * elem_size * num_comp + (k * elem_size + n - 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
295 impl->curl_orients[j + (3 * n - 1) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
296 … uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
297 impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
298 … uu[e * elem_size * num_comp + (k * elem_size + n + 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
299 impl->curl_orients[j + (3 * n + 3) * block_size + e * 3 * elem_size]; in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
302 …CeedPragmaAtomic vv[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] += vv_loc… in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
306 … vv_loc[j] = uu[e * elem_size * num_comp + (k * elem_size + n - 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
307 impl->curl_orients[j + (3 * n - 1) * block_size + e * 3 * elem_size] + in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
308 uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
309 impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]; in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
312 …CeedPragmaAtomic vv[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] += vv_loc… in CeedElemRestrictionApplyCurlOrientedTranspose_Ref_Core()
322 … const CeedInt elem_size, const CeedSize v_offset, in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core() argument
336 vv_loc[j] = uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
337 abs(impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
338 … uu[e * elem_size * num_comp + (k * elem_size + n + 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
339 abs(impl->curl_orients[j + (3 * n + 3) * block_size + e * 3 * elem_size]); in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
342 …CeedPragmaAtomic vv[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] += vv_loc… in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
344 for (n = 1; n < elem_size - 1; n++) { in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
346 … vv_loc[j] = uu[e * elem_size * num_comp + (k * elem_size + n - 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
347 … abs(impl->curl_orients[j + (3 * n - 1) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
348 … uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
349 … abs(impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
350 … uu[e * elem_size * num_comp + (k * elem_size + n + 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
351 abs(impl->curl_orients[j + (3 * n + 3) * block_size + e * 3 * elem_size]); in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
354 …CeedPragmaAtomic vv[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] += vv_loc… in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
358 … vv_loc[j] = uu[e * elem_size * num_comp + (k * elem_size + n - 1) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
359 abs(impl->curl_orients[j + (3 * n - 1) * block_size + e * 3 * elem_size]) + in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
360 uu[e * elem_size * num_comp + (k * elem_size + n) * block_size + j - v_offset] * in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
361 abs(impl->curl_orients[j + (3 * n + 1) * block_size + e * 3 * elem_size]); in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
364 …CeedPragmaAtomic vv[impl->offsets[j + n * block_size + e * elem_size] + k * comp_stride] += vv_loc… in CeedElemRestrictionApplyCurlOrientedUnsignedTranspose_Ref_Core()
399 CeedInt num_elem, elem_size; in CeedElemRestrictionApply_Ref_Core() local
406 CeedCallBackend(CeedElemRestrictionGetElementSize(rstr, &elem_size)); in CeedElemRestrictionApply_Ref_Core()
407 v_offset = start * block_size * elem_size * (CeedSize)num_comp; in CeedElemRestrictionApply_Ref_Core()
426 …ridedTranspose_Ref_Core(rstr, num_comp, block_size, start, stop, num_elem, elem_size, v_offset, uu, in CeedElemRestrictionApply_Ref_Core()
430 …OffsetTranspose_Ref_Core(rstr, num_comp, block_size, comp_stride, start, stop, num_elem, elem_size, in CeedElemRestrictionApply_Ref_Core()
436 … elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
438 …OffsetTranspose_Ref_Core(rstr, num_comp, block_size, comp_stride, start, stop, num_elem, elem_size, in CeedElemRestrictionApply_Ref_Core()
445 … elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
448 … num_elem, elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
450 …OffsetTranspose_Ref_Core(rstr, num_comp, block_size, comp_stride, start, stop, num_elem, elem_size, in CeedElemRestrictionApply_Ref_Core()
466 …StridedNoTranspose_Ref_Core(rstr, num_comp, block_size, start, stop, num_elem, elem_size, v_offset, in CeedElemRestrictionApply_Ref_Core()
470 …fsetNoTranspose_Ref_Core(rstr, num_comp, block_size, comp_stride, start, stop, num_elem, elem_size, in CeedElemRestrictionApply_Ref_Core()
476 … elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
479 … elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
485 … elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
488 … num_elem, elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
491 … elem_size, v_offset, uu, vv)); in CeedElemRestrictionApply_Ref_Core()
749 …CeedInt num_elem, elem_size, num_block, block_size, num_comp, comp_stride, num_po… in CeedElemRestrictionCreate_Ref() local
755 CeedCallBackend(CeedElemRestrictionGetElementSize(rstr, &elem_size)); in CeedElemRestrictionCreate_Ref()
770 CeedInt layout[3] = {1, elem_size, elem_size * num_comp}; in CeedElemRestrictionCreate_Ref()
812 for (CeedInt i = 0; i < num_elem * elem_size; i++) { in CeedElemRestrictionCreate_Ref()
820 …sets = rstr_type == CEED_RESTRICTION_POINTS ? (num_elem + 1 + num_points) : (num_elem * elem_size); in CeedElemRestrictionCreate_Ref()