xref: /honee/qfunctions/utils.h (revision 2a28a40b05596e8676ec98635f0ea5784ed7a63a)
1ae2b091fSJames Wright // SPDX-FileCopyrightText: Copyright (c) 2017-2024, HONEE contributors.
2ae2b091fSJames Wright // SPDX-License-Identifier: Apache-2.0 OR BSD-2-Clause
3c7ece6efSJeremy L Thompson #pragma once
4704b8bbeSJames Wright 
53e17a7a1SJames Wright #include <ceed/types.h>
63e17a7a1SJames Wright #ifndef CEED_RUNNING_JIT_PASS
7d0cce58aSJeremy L Thompson #include <math.h>
83e17a7a1SJames Wright #endif
9704b8bbeSJames Wright 
10704b8bbeSJames Wright #ifndef M_PI
11704b8bbeSJames Wright #define M_PI 3.14159265358979323846
12704b8bbeSJames Wright #endif
13704b8bbeSJames Wright 
14704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Max(CeedScalar a, CeedScalar b) { return a < b ? b : a; }
15704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Min(CeedScalar a, CeedScalar b) { return a < b ? a : b; }
16704b8bbeSJames Wright 
17bfa7851aSJames Wright CEED_QFUNCTION_HELPER void SwapScalar(CeedScalar *a, CeedScalar *b) {
18bfa7851aSJames Wright   CeedScalar temp = *a;
19bfa7851aSJames Wright   *a              = *b;
20bfa7851aSJames Wright   *b              = temp;
21bfa7851aSJames Wright }
22bfa7851aSJames Wright 
23704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Square(CeedScalar x) { return x * x; }
24704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Cube(CeedScalar x) { return x * x * x; }
25704b8bbeSJames Wright 
26e7754af5SKenneth E. Jansen // @brief Scale vector of length N by scalar alpha
27e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER void ScaleN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) {
288e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] *= alpha;
298e5e3595SJames Wright }
308e5e3595SJames Wright 
318e5e3595SJames Wright // @brief Set vector of length N to a value alpha
328e5e3595SJames Wright CEED_QFUNCTION_HELPER void SetValueN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) {
338e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] = alpha;
348e5e3595SJames Wright }
358e5e3595SJames Wright 
368e5e3595SJames Wright // @brief Copy N elements from x to y
378e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyN(const CeedScalar *x, CeedScalar *y, const CeedInt N) { CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) y[i] = x[i]; }
388e5e3595SJames Wright 
398e5e3595SJames Wright // @brief Copy 3x3 matrix from A to B
408e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyMat3(const CeedScalar A[3][3], CeedScalar B[3][3]) { CopyN((const CeedScalar *)A, (CeedScalar *)B, 9); }
418e5e3595SJames Wright 
428e5e3595SJames Wright // @brief Dot product of vectors with N elements
438e5e3595SJames Wright CEED_QFUNCTION_HELPER CeedScalar DotN(const CeedScalar *u, const CeedScalar *v, const CeedInt N) {
448e5e3595SJames Wright   CeedScalar output = 0;
458e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) output += u[i] * v[i];
468e5e3595SJames Wright   return output;
47e7754af5SKenneth E. Jansen }
48e7754af5SKenneth E. Jansen 
49704b8bbeSJames Wright // @brief Dot product of 3 element vectors
508fff8293SJames Wright CEED_QFUNCTION_HELPER CeedScalar Dot3(const CeedScalar *u, const CeedScalar *v) { return u[0] * v[0] + u[1] * v[1] + u[2] * v[2]; }
51704b8bbeSJames Wright 
52*2a28a40bSJames Wright // @brief Dot product of 2 element vectors
53*2a28a40bSJames Wright CEED_QFUNCTION_HELPER CeedScalar Dot2(const CeedScalar *u, const CeedScalar *v) { return u[0] * v[0] + u[1] * v[1]; }
54*2a28a40bSJames Wright 
5564667825SJames Wright // @brief \ell^2 norm of 3 element vectors
5664667825SJames Wright CEED_QFUNCTION_HELPER CeedScalar Norm3(const CeedScalar *u) { return sqrt(u[0] * u[0] + u[1] * u[1] + u[2] * u[2]); }
5764667825SJames Wright 
5883c0b726SJames Wright // @brief \ell^2 norm of 2 element vectors
5983c0b726SJames Wright CEED_QFUNCTION_HELPER CeedScalar Norm2(const CeedScalar *u) { return sqrt(u[0] * u[0] + u[1] * u[1]); }
6083c0b726SJames Wright 
618e5e3595SJames Wright // @brief Cross product of vectors with 3 elements
628e5e3595SJames Wright CEED_QFUNCTION_HELPER void Cross3(const CeedScalar u[3], const CeedScalar v[3], CeedScalar w[3]) {
638e5e3595SJames Wright   w[0] = (u[1] * v[2]) - (u[2] * v[1]);
648e5e3595SJames Wright   w[1] = (u[2] * v[0]) - (u[0] * v[2]);
658e5e3595SJames Wright   w[2] = (u[0] * v[1]) - (u[1] * v[0]);
668e5e3595SJames Wright }
678e5e3595SJames Wright 
688e5e3595SJames Wright // @brief Curl of vector given its gradient
698e5e3595SJames Wright CEED_QFUNCTION_HELPER void Curl3(const CeedScalar gradient[3][3], CeedScalar v[3]) {
708e5e3595SJames Wright   v[0] = gradient[2][1] - gradient[1][2];
718e5e3595SJames Wright   v[1] = gradient[0][2] - gradient[2][0];
728e5e3595SJames Wright   v[2] = gradient[1][0] - gradient[0][1];
738e5e3595SJames Wright }
748e5e3595SJames Wright 
758e5e3595SJames Wright // @brief Matrix vector product, b = Ax + b. A is NxM, x is M, b is N
768e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVecNM(const CeedScalar *A, const CeedScalar *x, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A,
778e5e3595SJames Wright                                     CeedScalar *b) {
788e5e3595SJames Wright   switch (transpose_A) {
798e5e3595SJames Wright     case CEED_NOTRANSPOSE:
808e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) b[i] += DotN(&A[i * M], x, M);
818e5e3595SJames Wright       break;
828e5e3595SJames Wright     case CEED_TRANSPOSE:
838e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) b[i] += A[j * M + i] * x[j]; }
848e5e3595SJames Wright       break;
858e5e3595SJames Wright   }
868e5e3595SJames Wright }
878e5e3595SJames Wright 
888e5e3595SJames Wright // @brief 3x3 Matrix vector product  b = Ax + b.
898e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVec3(const CeedScalar A[3][3], const CeedScalar x[3], const CeedTransposeMode transpose_A, CeedScalar b[3]) {
908e5e3595SJames Wright   MatVecNM((const CeedScalar *)A, (const CeedScalar *)x, 3, 3, transpose_A, (CeedScalar *)b);
918e5e3595SJames Wright }
928e5e3595SJames Wright 
93*2a28a40bSJames Wright // @brief 2x2 Matrix vector product  b = Ax + b.
94*2a28a40bSJames Wright CEED_QFUNCTION_HELPER void MatVec2(const CeedScalar A[2][2], const CeedScalar x[2], const CeedTransposeMode transpose_A, CeedScalar b[2]) {
95*2a28a40bSJames Wright   MatVecNM((const CeedScalar *)A, (const CeedScalar *)x, 2, 2, transpose_A, (CeedScalar *)b);
96*2a28a40bSJames Wright }
97*2a28a40bSJames Wright 
988e5e3595SJames Wright // @brief Matrix-Matrix product, B = DA + B, where D is diagonal.
998e5e3595SJames Wright // @details A is NxM, D is diagonal NxN, represented by a vector of length N, and B is NxM. Optionally, A may be transposed.
1008e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiagNM(const CeedScalar *A, const CeedScalar *D, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A,
1018e5e3595SJames Wright                                      CeedScalar *B) {
1028e5e3595SJames Wright   switch (transpose_A) {
1038e5e3595SJames Wright     case CEED_NOTRANSPOSE:
1048e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < M; j++) B[i * M + j] += D[i] * A[i * M + j]; }
1058e5e3595SJames Wright       break;
1068e5e3595SJames Wright     case CEED_TRANSPOSE:
1078e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) B[i * N + j] += D[i] * A[j * M + i]; }
1088e5e3595SJames Wright       break;
1098e5e3595SJames Wright   }
1108e5e3595SJames Wright }
1118e5e3595SJames Wright 
1128e5e3595SJames Wright // @brief 3x3 Matrix-Matrix product, B = DA + B, where D is diagonal.
1138e5e3595SJames Wright // @details Optionally, A may be transposed.
1148e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiag3(const CeedScalar A[3][3], const CeedScalar D[3], const CeedTransposeMode transpose_A, CeedScalar B[3][3]) {
1158e5e3595SJames Wright   MatDiagNM((const CeedScalar *)A, (const CeedScalar *)D, 3, 3, transpose_A, (CeedScalar *)B);
1168e5e3595SJames Wright }
117e975cfccSJames Wright // @brief NxN Matrix-Matrix product, C = AB + C
118e975cfccSJames Wright CEED_QFUNCTION_HELPER void MatMatN(const CeedScalar *A, const CeedScalar *B, const CeedInt N, const CeedTransposeMode transpose_A,
119e975cfccSJames Wright                                    const CeedTransposeMode transpose_B, CeedScalar *C) {
1208e5e3595SJames Wright   switch (transpose_A) {
1218e5e3595SJames Wright     case CEED_NOTRANSPOSE:
1228e5e3595SJames Wright       switch (transpose_B) {
1238e5e3595SJames Wright         case CEED_NOTRANSPOSE:
124e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
125e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
126e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[i * N + k] * B[k * N + j];
127e975cfccSJames Wright             }
1288e5e3595SJames Wright           }
1298e5e3595SJames Wright           break;
1308e5e3595SJames Wright         case CEED_TRANSPOSE:
131e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
132e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
133e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[i * N + k] * B[j * N + k];
134e975cfccSJames Wright             }
1358e5e3595SJames Wright           }
1368e5e3595SJames Wright           break;
1378e5e3595SJames Wright       }
1388e5e3595SJames Wright       break;
1398e5e3595SJames Wright     case CEED_TRANSPOSE:
1408e5e3595SJames Wright       switch (transpose_B) {
1418e5e3595SJames Wright         case CEED_NOTRANSPOSE:
142e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
143e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
144e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[k * N + i] * B[k * N + j];
145e975cfccSJames Wright             }
1468e5e3595SJames Wright           }
1478e5e3595SJames Wright           break;
1488e5e3595SJames Wright         case CEED_TRANSPOSE:
149e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
150e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
151e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[k * N + i] * B[j * N + k];
152e975cfccSJames Wright             }
1538e5e3595SJames Wright           }
1548e5e3595SJames Wright           break;
1558e5e3595SJames Wright       }
1568e5e3595SJames Wright       break;
1578e5e3595SJames Wright   }
1588e5e3595SJames Wright }
1598e5e3595SJames Wright 
160e975cfccSJames Wright // @brief 3x3 Matrix-Matrix product, C = AB + C
161e975cfccSJames Wright CEED_QFUNCTION_HELPER void MatMat3(const CeedScalar A[3][3], const CeedScalar B[3][3], const CeedTransposeMode transpose_A,
162e975cfccSJames Wright                                    const CeedTransposeMode transpose_B, CeedScalar C[3][3]) {
163e975cfccSJames Wright   MatMatN((const CeedScalar *)A, (const CeedScalar *)B, 3, transpose_A, transpose_B, (CeedScalar *)C);
164e975cfccSJames Wright }
165e975cfccSJames Wright 
166*2a28a40bSJames Wright // @brief 2x2 Matrix-Matrix product, C = AB + C
167*2a28a40bSJames Wright CEED_QFUNCTION_HELPER void MatMat2(const CeedScalar A[2][2], const CeedScalar B[2][2], const CeedTransposeMode transpose_A,
168*2a28a40bSJames Wright                                    const CeedTransposeMode transpose_B, CeedScalar C[2][2]) {
169*2a28a40bSJames Wright   MatMatN((const CeedScalar *)A, (const CeedScalar *)B, 2, transpose_A, transpose_B, (CeedScalar *)C);
170*2a28a40bSJames Wright }
171*2a28a40bSJames Wright 
17206f0a019SJames Wright /**
173d8667e38SJames Wright  * @brief Calculate inverse of 2x2 matrix
174d8667e38SJames Wright  *
175d8667e38SJames Wright  * @param[in]  A        Input matrix
176d8667e38SJames Wright  * @param[out] detJ_ptr Determinate of A, may be NULL is not desired
177d8667e38SJames Wright  * @param[out] A_inv    Output matrix inverse
178d8667e38SJames Wright  */
179d8667e38SJames Wright CEED_QFUNCTION_HELPER void MatInv2(const CeedScalar A[2][2], CeedScalar A_inv[2][2], CeedScalar *detJ_ptr) {
180d8667e38SJames Wright   const CeedScalar detJ = A[0][0] * A[1][1] - A[1][0] * A[0][1];
181d8667e38SJames Wright 
182d8667e38SJames Wright   A_inv[0][0] = A[1][1] / detJ;
183d8667e38SJames Wright   A_inv[0][1] = -A[0][1] / detJ;
184d8667e38SJames Wright   A_inv[1][0] = -A[1][0] / detJ;
185d8667e38SJames Wright   A_inv[1][1] = A[0][0] / detJ;
186d8667e38SJames Wright   if (detJ_ptr) *detJ_ptr = detJ;
187d8667e38SJames Wright }
188d8667e38SJames Wright 
189d8667e38SJames Wright /**
190d8667e38SJames Wright  * @brief Calculate inverse of 3x3 matrix
191d8667e38SJames Wright  *
192d8667e38SJames Wright  * @param[in]  A        Input matrix
193d8667e38SJames Wright  * @param[out] detJ_ptr Determinate of A, may be NULL is not desired
194d8667e38SJames Wright  * @param[out] A_inv    Output matrix inverse
195d8667e38SJames Wright  */
196d8667e38SJames Wright CEED_QFUNCTION_HELPER void MatInv3(const CeedScalar A[3][3], CeedScalar A_inv[3][3], CeedScalar *detJ_ptr) {
197d8667e38SJames Wright   // Compute Adjugate of dxdX
198d8667e38SJames Wright   A_inv[0][0] = A[1][1] * A[2][2] - A[1][2] * A[2][1];
199d8667e38SJames Wright   A_inv[0][1] = A[0][2] * A[2][1] - A[0][1] * A[2][2];
200d8667e38SJames Wright   A_inv[0][2] = A[0][1] * A[1][2] - A[0][2] * A[1][1];
201d8667e38SJames Wright   A_inv[1][0] = A[1][2] * A[2][0] - A[1][0] * A[2][2];
202d8667e38SJames Wright   A_inv[1][1] = A[0][0] * A[2][2] - A[0][2] * A[2][0];
203d8667e38SJames Wright   A_inv[1][2] = A[0][2] * A[1][0] - A[0][0] * A[1][2];
204d8667e38SJames Wright   A_inv[2][0] = A[1][0] * A[2][1] - A[1][1] * A[2][0];
205d8667e38SJames Wright   A_inv[2][1] = A[0][1] * A[2][0] - A[0][0] * A[2][1];
206d8667e38SJames Wright   A_inv[2][2] = A[0][0] * A[1][1] - A[0][1] * A[1][0];
207d8667e38SJames Wright 
208d8667e38SJames Wright   const CeedScalar detJ = A[0][0] * A_inv[0][0] + A[1][0] * A_inv[0][1] + A[2][0] * A_inv[0][2];
209d8667e38SJames Wright   ScaleN((CeedScalar *)A_inv, 1 / detJ, 9);
210d8667e38SJames Wright   if (detJ_ptr) *detJ_ptr = detJ;
211d8667e38SJames Wright }
212d8667e38SJames Wright 
213d8667e38SJames Wright /**
21406f0a019SJames Wright   @brief MxN Matrix-Matrix product, C = AB + C
21506f0a019SJames Wright 
21606f0a019SJames Wright   C is NxM, A is NxP, B is PxM
21706f0a019SJames Wright 
21806f0a019SJames Wright   @param[in]  mat_A Row-major matrix `A`
21906f0a019SJames Wright   @param[in]  mat_B Row-major matrix `B`
22006f0a019SJames Wright   @param[out] mat_C Row-major output matrix `C`
22106f0a019SJames Wright   @param[in]  N     Number of rows of `C`
22206f0a019SJames Wright   @param[in]  M     Number of columns of `C`
22306f0a019SJames Wright   @param[in]  P     Number of columns of `A`/rows of `B`
22406f0a019SJames Wright **/
22506f0a019SJames Wright CEED_QFUNCTION_HELPER void MatMatNM(const CeedScalar *mat_A, const CeedScalar *mat_B, CeedScalar *mat_C, CeedInt N, CeedInt M, CeedInt P) {
22606f0a019SJames Wright   for (CeedInt i = 0; i < N; i++) {
22706f0a019SJames Wright     for (CeedInt j = 0; j < M; j++) {
22806f0a019SJames Wright       for (CeedInt k = 0; k < P; k++) mat_C[i * M + j] += mat_A[i * P + k] * mat_B[k * M + j];
22906f0a019SJames Wright     }
23006f0a019SJames Wright   }
23106f0a019SJames Wright }
23206f0a019SJames Wright 
233704b8bbeSJames Wright // @brief Unpack Kelvin-Mandel notation symmetric tensor into full tensor
234704b8bbeSJames Wright CEED_QFUNCTION_HELPER void KMUnpack(const CeedScalar v[6], CeedScalar A[3][3]) {
235704b8bbeSJames Wright   const CeedScalar weight = 1 / sqrt(2.);
236704b8bbeSJames Wright   A[0][0]                 = v[0];
237704b8bbeSJames Wright   A[1][1]                 = v[1];
238704b8bbeSJames Wright   A[2][2]                 = v[2];
239704b8bbeSJames Wright   A[2][1] = A[1][2] = weight * v[3];
240704b8bbeSJames Wright   A[2][0] = A[0][2] = weight * v[4];
241704b8bbeSJames Wright   A[1][0] = A[0][1] = weight * v[5];
242704b8bbeSJames Wright }
243704b8bbeSJames Wright 
2448e5e3595SJames Wright // @brief Pack full tensor into Kelvin-Mandel notation symmetric tensor
2458e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMPack(const CeedScalar A[3][3], CeedScalar v[6]) {
2468e5e3595SJames Wright   const CeedScalar weight = sqrt(2.);
2478e5e3595SJames Wright   v[0]                    = A[0][0];
2488e5e3595SJames Wright   v[1]                    = A[1][1];
2498e5e3595SJames Wright   v[2]                    = A[2][2];
2508e5e3595SJames Wright   v[3]                    = A[2][1] * weight;
2518e5e3595SJames Wright   v[4]                    = A[2][0] * weight;
2528e5e3595SJames Wright   v[5]                    = A[1][0] * weight;
2538e5e3595SJames Wright }
2548e5e3595SJames Wright 
2558e5e3595SJames Wright // @brief Calculate metric tensor from mapping, g_{ij} = xi_{k,i} xi_{k,j} = dXdx^T dXdx
2568e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMMetricTensor(const CeedScalar dXdx[3][3], CeedScalar km_g_ij[6]) {
2578e5e3595SJames Wright   CeedScalar g_ij[3][3] = {{0.}};
2588e5e3595SJames Wright   MatMat3(dXdx, dXdx, CEED_TRANSPOSE, CEED_NOTRANSPOSE, g_ij);
2598e5e3595SJames Wright   KMPack(g_ij, km_g_ij);
2608e5e3595SJames Wright }
2618e5e3595SJames Wright 
262e7754af5SKenneth E. Jansen // @brief Linear ramp evaluation
263e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER CeedScalar LinearRampCoefficient(CeedScalar amplitude, CeedScalar length, CeedScalar start, CeedScalar x) {
264e7754af5SKenneth E. Jansen   if (x < start) {
265e7754af5SKenneth E. Jansen     return amplitude;
266e7754af5SKenneth E. Jansen   } else if (x < start + length) {
267e7754af5SKenneth E. Jansen     return amplitude * ((x - start) * (-1 / length) + 1);
268e7754af5SKenneth E. Jansen   } else {
269e7754af5SKenneth E. Jansen     return 0;
270e7754af5SKenneth E. Jansen   }
271e7754af5SKenneth E. Jansen }
272e7754af5SKenneth E. Jansen 
273ade49511SJames Wright /**
274ade49511SJames Wright   @brief Pack stored values at quadrature point
275ade49511SJames Wright 
276ade49511SJames Wright   @param[in]   Q              Number of quadrature points
277ade49511SJames Wright   @param[in]   i              Current quadrature point
278ade49511SJames Wright   @param[in]   start          Starting index to store components
279ade49511SJames Wright   @param[in]   num_comp       Number of components to store
2806764667bSJames Wright   @param[in]   values_at_qpnt Local values for quadrature point i
281ade49511SJames Wright   @param[out]  stored         Stored values
282ade49511SJames Wright 
283ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
284ade49511SJames Wright **/
2856764667bSJames Wright CEED_QFUNCTION_HELPER int StoredValuesPack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *values_at_qpnt,
2866764667bSJames Wright                                            CeedScalar *stored) {
2876764667bSJames Wright   for (CeedInt j = 0; j < num_comp; j++) stored[(start + j) * Q + i] = values_at_qpnt[j];
288ade49511SJames Wright 
289ade49511SJames Wright   return CEED_ERROR_SUCCESS;
290ade49511SJames Wright }
291ade49511SJames Wright 
292ade49511SJames Wright /**
293ade49511SJames Wright   @brief Unpack stored values at quadrature point
294ade49511SJames Wright 
295ade49511SJames Wright   @param[in]   Q              Number of quadrature points
296ade49511SJames Wright   @param[in]   i              Current quadrature point
297ade49511SJames Wright   @param[in]   start          Starting index to store components
298ade49511SJames Wright   @param[in]   num_comp       Number of components to store
299ade49511SJames Wright   @param[in]   stored         Stored values
3006764667bSJames Wright   @param[out]  values_at_qpnt Local values for quadrature point i
301ade49511SJames Wright 
302ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
303ade49511SJames Wright **/
3046764667bSJames Wright CEED_QFUNCTION_HELPER int StoredValuesUnpack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *stored,
3056764667bSJames Wright                                              CeedScalar *values_at_qpnt) {
3066764667bSJames Wright   for (CeedInt j = 0; j < num_comp; j++) values_at_qpnt[j] = stored[(start + j) * Q + i];
307ade49511SJames Wright 
308ade49511SJames Wright   return CEED_ERROR_SUCCESS;
309ade49511SJames Wright }
310ade49511SJames Wright 
311ade49511SJames Wright /**
312e1bedf8cSJames Wright   @brief Unpack N-D element q_data at quadrature point
313e1bedf8cSJames Wright 
314e1bedf8cSJames Wright   @param[in]   dim       Dimension of the element
315e1bedf8cSJames Wright   @param[in]   Q         Number of quadrature points
316e1bedf8cSJames Wright   @param[in]   i         Current quadrature point
317e1bedf8cSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
318e1bedf8cSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
319e1bedf8cSJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [dim][dim]), or `NULL`
320e77831d2SJames Wright 
321e77831d2SJames Wright   @return An error code: 0 - success, otherwise - failure
322e1bedf8cSJames Wright **/
323e77831d2SJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_ND(CeedInt dim, CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar *dXdx) {
324e1bedf8cSJames Wright   switch (dim) {
325e1bedf8cSJames Wright     case 2:
326e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
327e1bedf8cSJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 4, q_data, dXdx);
328e1bedf8cSJames Wright       break;
329e1bedf8cSJames Wright     case 3:
330e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
331e1bedf8cSJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 9, q_data, dXdx);
332e1bedf8cSJames Wright       break;
333e1bedf8cSJames Wright   }
334e77831d2SJames Wright   return CEED_ERROR_SUCCESS;
335e1bedf8cSJames Wright }
336e1bedf8cSJames Wright 
337e1bedf8cSJames Wright /**
338e1bedf8cSJames Wright   @brief Unpack boundary element q_data for N-D problem at quadrature point
339e1bedf8cSJames Wright 
340e77831d2SJames Wright   @param[in]   dim       Dimension of the element
341e1bedf8cSJames Wright   @param[in]   Q         Number of quadrature points
342e1bedf8cSJames Wright   @param[in]   i         Current quadrature point
343e1bedf8cSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
344e1bedf8cSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
345e1bedf8cSJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [dim - 1][dim]), or `NULL`
346e1bedf8cSJames Wright   @param[out]  normal    Components of the normal vector (shape [dim]), or `NULL`
347e77831d2SJames Wright 
348e77831d2SJames Wright   @return An error code: 0 - success, otherwise - failure
349e1bedf8cSJames Wright **/
350e77831d2SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_ND(CeedInt dim, CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar *dXdx,
351e1bedf8cSJames Wright                                                  CeedScalar *normal) {
352e1bedf8cSJames Wright   switch (dim) {
353e1bedf8cSJames Wright     case 2:
354e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
355e1bedf8cSJames Wright       if (normal) StoredValuesUnpack(Q, i, 1, 2, q_data, normal);
356e1bedf8cSJames Wright       break;
357e1bedf8cSJames Wright     case 3:
358e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
359e1bedf8cSJames Wright       if (normal) StoredValuesUnpack(Q, i, 1, 3, q_data, normal);
360e1bedf8cSJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 4, 6, q_data, (CeedScalar *)dXdx);
361e1bedf8cSJames Wright       break;
362e1bedf8cSJames Wright   }
363e77831d2SJames Wright   return CEED_ERROR_SUCCESS;
364e1bedf8cSJames Wright }
365e1bedf8cSJames Wright 
366e1bedf8cSJames Wright /**
367da8b59d6SJames Wright   @brief Unpack boundary element q_data for N-D problem at quadrature point
368da8b59d6SJames Wright 
369da8b59d6SJames Wright   @param[in]   dim       Dimension of the element
370da8b59d6SJames Wright   @param[in]   Q         Number of quadrature points
371da8b59d6SJames Wright   @param[in]   i         Current quadrature point
372da8b59d6SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundaryGradient`)
373da8b59d6SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
374da8b59d6SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [dim][dim]), or `NULL`
375da8b59d6SJames Wright   @param[out]  normal    Components of the normal vector (shape [dim]), or `NULL`
376da8b59d6SJames Wright 
377da8b59d6SJames Wright   @return An error code: 0 - success, otherwise - failure
378da8b59d6SJames Wright **/
379da8b59d6SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryGradientUnpack_ND(CeedInt dim, CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ,
380da8b59d6SJames Wright                                                          CeedScalar *dXdx, CeedScalar *normal) {
381da8b59d6SJames Wright   switch (dim) {
382da8b59d6SJames Wright     case 2:
383da8b59d6SJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
384da8b59d6SJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 4, q_data, dXdx);
385da8b59d6SJames Wright       if (normal) StoredValuesUnpack(Q, i, 5, 2, q_data, normal);
386da8b59d6SJames Wright       break;
387da8b59d6SJames Wright     case 3:
388da8b59d6SJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
389da8b59d6SJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 9, q_data, dXdx);
390da8b59d6SJames Wright       if (normal) StoredValuesUnpack(Q, i, 10, 3, q_data, normal);
391da8b59d6SJames Wright       break;
392da8b59d6SJames Wright   }
393da8b59d6SJames Wright   return CEED_ERROR_SUCCESS;
394da8b59d6SJames Wright }
395da8b59d6SJames Wright 
396da8b59d6SJames Wright /**
397ade49511SJames Wright   @brief Unpack 3D element q_data at quadrature point
398ade49511SJames Wright 
399ade49511SJames Wright   @param[in]   Q         Number of quadrature points
400ade49511SJames Wright   @param[in]   i         Current quadrature point
401ade49511SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
402ade49511SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian
403ade49511SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [3][3])
404ade49511SJames Wright 
405ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
406ade49511SJames Wright **/
407ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[3][3]) {
408e77831d2SJames Wright   return QdataUnpack_ND(3, Q, i, q_data, wdetJ, (CeedScalar *)dXdx);
409ade49511SJames Wright }
410ade49511SJames Wright 
411ade49511SJames Wright /**
412ade49511SJames Wright   @brief Unpack boundary element q_data for 3D problem at quadrature point
413ade49511SJames Wright 
414ade49511SJames Wright   @param[in]   Q         Number of quadrature points
415ade49511SJames Wright   @param[in]   i         Current quadrature point
4162c512a7bSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
417ade49511SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
418ade49511SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][3]), or `NULL`
419ade49511SJames Wright   @param[out]  normal    Components of the normal vector (shape [3]), or `NULL`
420ade49511SJames Wright 
421ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
422ade49511SJames Wright **/
423ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][3],
424ade49511SJames Wright                                                  CeedScalar normal[3]) {
425e77831d2SJames Wright   return QdataBoundaryUnpack_ND(3, Q, i, q_data, wdetJ, (CeedScalar *)dXdx, normal);
426ade49511SJames Wright }
427ade49511SJames Wright 
428baadde1fSJames Wright /**
42915c15616SJames Wright   @brief Unpack boundary element q_data for 3D problem at quadrature point
43015c15616SJames Wright 
43115c15616SJames Wright   @param[in]   Q         Number of quadrature points
43215c15616SJames Wright   @param[in]   i         Current quadrature point
43315c15616SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
43415c15616SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
435e77831d2SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [3][3]), or `NULL`
43615c15616SJames Wright   @param[out]  normal    Components of the normal vector (shape [3]), or `NULL`
43715c15616SJames Wright 
43815c15616SJames Wright   @return An error code: 0 - success, otherwise - failure
43915c15616SJames Wright **/
440e77831d2SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryGradientUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[3][3],
44115c15616SJames Wright                                                          CeedScalar normal[3]) {
442da8b59d6SJames Wright   return QdataBoundaryGradientUnpack_ND(3, Q, i, q_data, wdetJ, (CeedScalar *)dXdx, normal);
44315c15616SJames Wright }
44415c15616SJames Wright 
44515c15616SJames Wright /**
446baadde1fSJames Wright   @brief Unpack 2D element q_data at quadrature point
447baadde1fSJames Wright 
448baadde1fSJames Wright   @param[in]   Q         Number of quadrature points
449baadde1fSJames Wright   @param[in]   i         Current quadrature point
450baadde1fSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
451baadde1fSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian
452baadde1fSJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][2])
453baadde1fSJames Wright 
454baadde1fSJames Wright   @return An error code: 0 - success, otherwise - failure
455baadde1fSJames Wright **/
456baadde1fSJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][2]) {
457e1bedf8cSJames Wright   QdataUnpack_ND(2, Q, i, q_data, wdetJ, (CeedScalar *)dXdx);
458baadde1fSJames Wright   return CEED_ERROR_SUCCESS;
459baadde1fSJames Wright }
460baadde1fSJames Wright 
4612c512a7bSJames Wright /**
4622c512a7bSJames Wright   @brief Unpack boundary element q_data for 2D problem at quadrature point
4632c512a7bSJames Wright 
4642c512a7bSJames Wright   @param[in]   Q         Number of quadrature points
4652c512a7bSJames Wright   @param[in]   i         Current quadrature point
4662c512a7bSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary2d`)
4672c512a7bSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
4682c512a7bSJames Wright   @param[out]  normal    Components of the normal vector (shape [2]), or `NULL`
4692c512a7bSJames Wright 
4702c512a7bSJames Wright   @return An error code: 0 - success, otherwise - failure
4712c512a7bSJames Wright **/
4722c512a7bSJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar normal[2]) {
473e1bedf8cSJames Wright   QdataBoundaryUnpack_ND(3, Q, i, q_data, wdetJ, NULL, normal);
4742c512a7bSJames Wright   return CEED_ERROR_SUCCESS;
4752c512a7bSJames Wright }
47606f0a019SJames Wright 
47706f0a019SJames Wright /**
478da8b59d6SJames Wright   @brief Unpack boundary element q_data for 2D problem at quadrature point
479da8b59d6SJames Wright 
480da8b59d6SJames Wright   @param[in]   Q         Number of quadrature points
481da8b59d6SJames Wright   @param[in]   i         Current quadrature point
482da8b59d6SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
483da8b59d6SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
484da8b59d6SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][2]), or `NULL`
485da8b59d6SJames Wright   @param[out]  normal    Components of the normal vector (shape [2]), or `NULL`
486da8b59d6SJames Wright 
487da8b59d6SJames Wright   @return An error code: 0 - success, otherwise - failure
488da8b59d6SJames Wright **/
489da8b59d6SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryGradientUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][2],
490da8b59d6SJames Wright                                                          CeedScalar normal[2]) {
491da8b59d6SJames Wright   return QdataBoundaryGradientUnpack_ND(2, Q, i, q_data, wdetJ, (CeedScalar *)dXdx, normal);
492da8b59d6SJames Wright }
493da8b59d6SJames Wright 
494da8b59d6SJames Wright /**
49506f0a019SJames Wright   @brief Unpack `CEED_EVAL_GRAD` QF input into quadrature-point local array
49606f0a019SJames Wright 
49706f0a019SJames Wright   @param[in]  Q          Number of quadrature points
49806f0a019SJames Wright   @param[in]  i          Current quadrature point
49906f0a019SJames Wright   @param[in]  num_comp   Number of components of the input
50006f0a019SJames Wright   @param[in]  dim        Topological dimension of the element (ie. number of derivative terms per component)
50106f0a019SJames Wright   @param[in]  grad       QF gradient input, shape `[dim][num_comp][Q]`
502db7fbcd2SJames Wright   @param[out] grad_local Gradient array at quadrature point Q, shape `[num_comp][dim]`
50306f0a019SJames Wright **/
504db7fbcd2SJames Wright CEED_QFUNCTION_HELPER void GradUnpackN(CeedInt Q, CeedInt i, CeedInt num_comp, CeedInt dim, const CeedScalar *grad, CeedScalar *grad_local) {
50506f0a019SJames Wright   for (CeedInt d = 0; d < dim; d++) {
50606f0a019SJames Wright     for (CeedInt c = 0; c < num_comp; c++) {
507db7fbcd2SJames Wright       grad_local[dim * c + d] = grad[(Q * num_comp) * d + Q * c + i];
50806f0a019SJames Wright     }
50906f0a019SJames Wright   }
51006f0a019SJames Wright }
51106f0a019SJames Wright 
51206f0a019SJames Wright /**
51306f0a019SJames Wright   @brief Unpack `CEED_EVAL_GRAD` QF input into quadrature-point local array for 3D elements
51406f0a019SJames Wright 
51506f0a019SJames Wright   @param[in]  Q          Number of quadrature points
51606f0a019SJames Wright   @param[in]  i          Current quadrature point
51706f0a019SJames Wright   @param[in]  num_comp   Number of components of the input
51883c0b726SJames Wright   @param[in]  grad       QF gradient input, shape `[3][num_comp][Q]`
519db7fbcd2SJames Wright   @param[out] grad_local Gradient array at quadrature point Q, shape `[num_comp][3]`
52006f0a019SJames Wright **/
521db7fbcd2SJames Wright CEED_QFUNCTION_HELPER void GradUnpack3(CeedInt Q, CeedInt i, CeedInt num_comp, const CeedScalar *grad, CeedScalar (*grad_local)[3]) {
522db7fbcd2SJames Wright   GradUnpackN(Q, i, num_comp, 3, grad, (CeedScalar *)grad_local);
52306f0a019SJames Wright }
5248c85b835SJames Wright 
5258c85b835SJames Wright /**
52683c0b726SJames Wright   @brief Unpack `CEED_EVAL_GRAD` QF input into quadrature-point local array for 2D elements
52783c0b726SJames Wright 
52883c0b726SJames Wright   @param[in]  Q          Number of quadrature points
52983c0b726SJames Wright   @param[in]  i          Current quadrature point
53083c0b726SJames Wright   @param[in]  num_comp   Number of components of the input
53183c0b726SJames Wright   @param[in]  grad       QF gradient input, shape `[2][num_comp][Q]`
532db7fbcd2SJames Wright   @param[out] grad_local Gradient array at quadrature point Q, shape `[num_comp][2]`
53383c0b726SJames Wright **/
534db7fbcd2SJames Wright CEED_QFUNCTION_HELPER void GradUnpack2(CeedInt Q, CeedInt i, CeedInt num_comp, const CeedScalar *grad, CeedScalar (*grad_local)[2]) {
535db7fbcd2SJames Wright   GradUnpackN(Q, i, num_comp, 2, grad, (CeedScalar *)grad_local);
53683c0b726SJames Wright }
53783c0b726SJames Wright 
53883c0b726SJames Wright /**
5398c85b835SJames Wright   @brief Calculate divergence from reference gradient
5408c85b835SJames Wright 
5418c85b835SJames Wright   Given gradient array G_{ij} and inverse element mapping X_{ij}, then the divergence is
5428c85b835SJames Wright 
5438c85b835SJames Wright   G_{ij} X{ji}
5448c85b835SJames Wright 
5458c85b835SJames Wright   @param[in]  grad_qn    Gradient array, orientation [vector component][gradient direction]
5468c85b835SJames Wright   @param[in]  dXdx       Inverse of the mapping Jacobian (shape [dim][dim])
5478c85b835SJames Wright   @param[in]  dim        Dimension of the problem
5488c85b835SJames Wright   @param[out] divergence The divergence
5498c85b835SJames Wright **/
5508c85b835SJames Wright CEED_QFUNCTION_HELPER void DivergenceND(const CeedScalar *grad_qn, const CeedScalar *dXdx, const CeedInt dim, CeedScalar *divergence) {
5518c85b835SJames Wright   for (CeedInt i = 0; i < dim; i++) {
5528c85b835SJames Wright     for (CeedInt j = 0; j < dim; j++) {
5538c85b835SJames Wright       *divergence += grad_qn[i * dim + j] * dXdx[j * dim + i];
5548c85b835SJames Wright     }
5558c85b835SJames Wright   }
5568c85b835SJames Wright }
5578c85b835SJames Wright 
5588c85b835SJames Wright /**
5598c85b835SJames Wright   @brief Calculate divergence from reference gradient for 3D problem
5608c85b835SJames Wright 
5618c85b835SJames Wright   Given gradient array G_{ij} and inverse element mapping X_{ij}, then the divergence is
5628c85b835SJames Wright 
5638c85b835SJames Wright   G_{ij} X{ji}
5648c85b835SJames Wright 
5658c85b835SJames Wright   @param[in]  grad_qn    Gradient array, orientation [vector component][gradient direction]
5668c85b835SJames Wright   @param[in]  dXdx       Inverse of the mapping Jacobian (shape [3][3])
5678c85b835SJames Wright   @param[out] divergence The divergence
5688c85b835SJames Wright **/
5698c85b835SJames Wright CEED_QFUNCTION_HELPER void Divergence3D(const CeedScalar grad_qn[3][3], const CeedScalar dXdx[3][3], CeedScalar *divergence) {
5708c85b835SJames Wright   DivergenceND((const CeedScalar *)grad_qn, (const CeedScalar *)dXdx, 3, divergence);
5718c85b835SJames Wright }
572