xref: /honee/qfunctions/utils.h (revision ade4951188ee005b66ffd0a9de0bd2ad8f48d7f6)
1704b8bbeSJames Wright // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
2704b8bbeSJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3704b8bbeSJames Wright //
4704b8bbeSJames Wright // SPDX-License-Identifier: BSD-2-Clause
5704b8bbeSJames Wright //
6704b8bbeSJames Wright // This file is part of CEED:  http://github.com/ceed
7704b8bbeSJames Wright 
8704b8bbeSJames Wright #ifndef utils_h
9704b8bbeSJames Wright #define utils_h
10704b8bbeSJames Wright 
11704b8bbeSJames Wright #include <ceed.h>
12d0cce58aSJeremy L Thompson #include <math.h>
13704b8bbeSJames Wright 
14704b8bbeSJames Wright #ifndef M_PI
15704b8bbeSJames Wright #define M_PI 3.14159265358979323846
16704b8bbeSJames Wright #endif
17704b8bbeSJames Wright 
18704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Max(CeedScalar a, CeedScalar b) { return a < b ? b : a; }
19704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Min(CeedScalar a, CeedScalar b) { return a < b ? a : b; }
20704b8bbeSJames Wright 
21bfa7851aSJames Wright CEED_QFUNCTION_HELPER void SwapScalar(CeedScalar *a, CeedScalar *b) {
22bfa7851aSJames Wright   CeedScalar temp = *a;
23bfa7851aSJames Wright   *a              = *b;
24bfa7851aSJames Wright   *b              = temp;
25bfa7851aSJames Wright }
26bfa7851aSJames Wright 
27704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Square(CeedScalar x) { return x * x; }
28704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Cube(CeedScalar x) { return x * x * x; }
29704b8bbeSJames Wright 
30e7754af5SKenneth E. Jansen // @brief Scale vector of length N by scalar alpha
31e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER void ScaleN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) {
328e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] *= alpha;
338e5e3595SJames Wright }
348e5e3595SJames Wright 
358e5e3595SJames Wright // @brief Set vector of length N to a value alpha
368e5e3595SJames Wright CEED_QFUNCTION_HELPER void SetValueN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) {
378e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] = alpha;
388e5e3595SJames Wright }
398e5e3595SJames Wright 
408e5e3595SJames Wright // @brief Copy N elements from x to y
418e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyN(const CeedScalar *x, CeedScalar *y, const CeedInt N) { CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) y[i] = x[i]; }
428e5e3595SJames Wright 
438e5e3595SJames Wright // @brief Copy 3x3 matrix from A to B
448e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyMat3(const CeedScalar A[3][3], CeedScalar B[3][3]) { CopyN((const CeedScalar *)A, (CeedScalar *)B, 9); }
458e5e3595SJames Wright 
468e5e3595SJames Wright // @brief Dot product of vectors with N elements
478e5e3595SJames Wright CEED_QFUNCTION_HELPER CeedScalar DotN(const CeedScalar *u, const CeedScalar *v, const CeedInt N) {
488e5e3595SJames Wright   CeedScalar output = 0;
498e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) output += u[i] * v[i];
508e5e3595SJames Wright   return output;
51e7754af5SKenneth E. Jansen }
52e7754af5SKenneth E. Jansen 
53704b8bbeSJames Wright // @brief Dot product of 3 element vectors
548fff8293SJames Wright CEED_QFUNCTION_HELPER CeedScalar Dot3(const CeedScalar *u, const CeedScalar *v) { return u[0] * v[0] + u[1] * v[1] + u[2] * v[2]; }
55704b8bbeSJames Wright 
568e5e3595SJames Wright // @brief Cross product of vectors with 3 elements
578e5e3595SJames Wright CEED_QFUNCTION_HELPER void Cross3(const CeedScalar u[3], const CeedScalar v[3], CeedScalar w[3]) {
588e5e3595SJames Wright   w[0] = (u[1] * v[2]) - (u[2] * v[1]);
598e5e3595SJames Wright   w[1] = (u[2] * v[0]) - (u[0] * v[2]);
608e5e3595SJames Wright   w[2] = (u[0] * v[1]) - (u[1] * v[0]);
618e5e3595SJames Wright }
628e5e3595SJames Wright 
638e5e3595SJames Wright // @brief Curl of vector given its gradient
648e5e3595SJames Wright CEED_QFUNCTION_HELPER void Curl3(const CeedScalar gradient[3][3], CeedScalar v[3]) {
658e5e3595SJames Wright   v[0] = gradient[2][1] - gradient[1][2];
668e5e3595SJames Wright   v[1] = gradient[0][2] - gradient[2][0];
678e5e3595SJames Wright   v[2] = gradient[1][0] - gradient[0][1];
688e5e3595SJames Wright }
698e5e3595SJames Wright 
708e5e3595SJames Wright // @brief Matrix vector product, b = Ax + b. A is NxM, x is M, b is N
718e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVecNM(const CeedScalar *A, const CeedScalar *x, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A,
728e5e3595SJames Wright                                     CeedScalar *b) {
738e5e3595SJames Wright   switch (transpose_A) {
748e5e3595SJames Wright     case CEED_NOTRANSPOSE:
758e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) b[i] += DotN(&A[i * M], x, M);
768e5e3595SJames Wright       break;
778e5e3595SJames Wright     case CEED_TRANSPOSE:
788e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) b[i] += A[j * M + i] * x[j]; }
798e5e3595SJames Wright       break;
808e5e3595SJames Wright   }
818e5e3595SJames Wright }
828e5e3595SJames Wright 
838e5e3595SJames Wright // @brief 3x3 Matrix vector product  b = Ax + b.
848e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVec3(const CeedScalar A[3][3], const CeedScalar x[3], const CeedTransposeMode transpose_A, CeedScalar b[3]) {
858e5e3595SJames Wright   MatVecNM((const CeedScalar *)A, (const CeedScalar *)x, 3, 3, transpose_A, (CeedScalar *)b);
868e5e3595SJames Wright }
878e5e3595SJames Wright 
888e5e3595SJames Wright // @brief Matrix-Matrix product, B = DA + B, where D is diagonal.
898e5e3595SJames Wright // @details A is NxM, D is diagonal NxN, represented by a vector of length N, and B is NxM. Optionally, A may be transposed.
908e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiagNM(const CeedScalar *A, const CeedScalar *D, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A,
918e5e3595SJames Wright                                      CeedScalar *B) {
928e5e3595SJames Wright   switch (transpose_A) {
938e5e3595SJames Wright     case CEED_NOTRANSPOSE:
948e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < M; j++) B[i * M + j] += D[i] * A[i * M + j]; }
958e5e3595SJames Wright       break;
968e5e3595SJames Wright     case CEED_TRANSPOSE:
978e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) B[i * N + j] += D[i] * A[j * M + i]; }
988e5e3595SJames Wright       break;
998e5e3595SJames Wright   }
1008e5e3595SJames Wright }
1018e5e3595SJames Wright 
1028e5e3595SJames Wright // @brief 3x3 Matrix-Matrix product, B = DA + B, where D is diagonal.
1038e5e3595SJames Wright // @details Optionally, A may be transposed.
1048e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiag3(const CeedScalar A[3][3], const CeedScalar D[3], const CeedTransposeMode transpose_A, CeedScalar B[3][3]) {
1058e5e3595SJames Wright   MatDiagNM((const CeedScalar *)A, (const CeedScalar *)D, 3, 3, transpose_A, (CeedScalar *)B);
1068e5e3595SJames Wright }
1078e5e3595SJames Wright 
1088e5e3595SJames Wright // @brief 3x3 Matrix-Matrix product, C = AB + C
1098e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatMat3(const CeedScalar A[3][3], const CeedScalar B[3][3], const CeedTransposeMode transpose_A,
1108e5e3595SJames Wright                                    const CeedTransposeMode transpose_B, CeedScalar C[3][3]) {
1118e5e3595SJames Wright   switch (transpose_A) {
1128e5e3595SJames Wright     case CEED_NOTRANSPOSE:
1138e5e3595SJames Wright       switch (transpose_B) {
1148e5e3595SJames Wright         case CEED_NOTRANSPOSE:
1158e5e3595SJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) {
1168e5e3595SJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[i][k] * B[k][j]; }
1178e5e3595SJames Wright           }
1188e5e3595SJames Wright           break;
1198e5e3595SJames Wright         case CEED_TRANSPOSE:
1208e5e3595SJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) {
1218e5e3595SJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[i][k] * B[j][k]; }
1228e5e3595SJames Wright           }
1238e5e3595SJames Wright           break;
1248e5e3595SJames Wright       }
1258e5e3595SJames Wright       break;
1268e5e3595SJames Wright     case CEED_TRANSPOSE:
1278e5e3595SJames Wright       switch (transpose_B) {
1288e5e3595SJames Wright         case CEED_NOTRANSPOSE:
1298e5e3595SJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) {
1308e5e3595SJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[k][i] * B[k][j]; }
1318e5e3595SJames Wright           }
1328e5e3595SJames Wright           break;
1338e5e3595SJames Wright         case CEED_TRANSPOSE:
1348e5e3595SJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) {
1358e5e3595SJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[k][i] * B[j][k]; }
1368e5e3595SJames Wright           }
1378e5e3595SJames Wright           break;
1388e5e3595SJames Wright       }
1398e5e3595SJames Wright       break;
1408e5e3595SJames Wright   }
1418e5e3595SJames Wright }
1428e5e3595SJames Wright 
143704b8bbeSJames Wright // @brief Unpack Kelvin-Mandel notation symmetric tensor into full tensor
144704b8bbeSJames Wright CEED_QFUNCTION_HELPER void KMUnpack(const CeedScalar v[6], CeedScalar A[3][3]) {
145704b8bbeSJames Wright   const CeedScalar weight = 1 / sqrt(2.);
146704b8bbeSJames Wright   A[0][0]                 = v[0];
147704b8bbeSJames Wright   A[1][1]                 = v[1];
148704b8bbeSJames Wright   A[2][2]                 = v[2];
149704b8bbeSJames Wright   A[2][1] = A[1][2] = weight * v[3];
150704b8bbeSJames Wright   A[2][0] = A[0][2] = weight * v[4];
151704b8bbeSJames Wright   A[1][0] = A[0][1] = weight * v[5];
152704b8bbeSJames Wright }
153704b8bbeSJames Wright 
1548e5e3595SJames Wright // @brief Pack full tensor into Kelvin-Mandel notation symmetric tensor
1558e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMPack(const CeedScalar A[3][3], CeedScalar v[6]) {
1568e5e3595SJames Wright   const CeedScalar weight = sqrt(2.);
1578e5e3595SJames Wright   v[0]                    = A[0][0];
1588e5e3595SJames Wright   v[1]                    = A[1][1];
1598e5e3595SJames Wright   v[2]                    = A[2][2];
1608e5e3595SJames Wright   v[3]                    = A[2][1] * weight;
1618e5e3595SJames Wright   v[4]                    = A[2][0] * weight;
1628e5e3595SJames Wright   v[5]                    = A[1][0] * weight;
1638e5e3595SJames Wright }
1648e5e3595SJames Wright 
1658e5e3595SJames Wright // @brief Calculate metric tensor from mapping, g_{ij} = xi_{k,i} xi_{k,j} = dXdx^T dXdx
1668e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMMetricTensor(const CeedScalar dXdx[3][3], CeedScalar km_g_ij[6]) {
1678e5e3595SJames Wright   CeedScalar g_ij[3][3] = {{0.}};
1688e5e3595SJames Wright   MatMat3(dXdx, dXdx, CEED_TRANSPOSE, CEED_NOTRANSPOSE, g_ij);
1698e5e3595SJames Wright   KMPack(g_ij, km_g_ij);
1708e5e3595SJames Wright }
1718e5e3595SJames Wright 
172e7754af5SKenneth E. Jansen // @brief Linear ramp evaluation
173e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER CeedScalar LinearRampCoefficient(CeedScalar amplitude, CeedScalar length, CeedScalar start, CeedScalar x) {
174e7754af5SKenneth E. Jansen   if (x < start) {
175e7754af5SKenneth E. Jansen     return amplitude;
176e7754af5SKenneth E. Jansen   } else if (x < start + length) {
177e7754af5SKenneth E. Jansen     return amplitude * ((x - start) * (-1 / length) + 1);
178e7754af5SKenneth E. Jansen   } else {
179e7754af5SKenneth E. Jansen     return 0;
180e7754af5SKenneth E. Jansen   }
181e7754af5SKenneth E. Jansen }
182e7754af5SKenneth E. Jansen 
183*ade49511SJames Wright /**
184*ade49511SJames Wright   @brief Pack stored values at quadrature point
185*ade49511SJames Wright 
186*ade49511SJames Wright   @param[in]   Q         Number of quadrature points
187*ade49511SJames Wright   @param[in]   i         Current quadrature point
188*ade49511SJames Wright   @param[in]   start     Starting index to store components
189*ade49511SJames Wright   @param[in]   num_comp  Number of components to store
190*ade49511SJames Wright   @param[in]   local     Local values for quadrature point i
191*ade49511SJames Wright   @param[out]  stored    Stored values
192*ade49511SJames Wright 
193*ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
194*ade49511SJames Wright **/
195*ade49511SJames Wright CEED_QFUNCTION_HELPER int StoredValuesPack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *local, CeedScalar *stored) {
196*ade49511SJames Wright   for (CeedInt j = 0; j < num_comp; j++) stored[(start + j) * Q + i] = local[j];
197*ade49511SJames Wright 
198*ade49511SJames Wright   return CEED_ERROR_SUCCESS;
199*ade49511SJames Wright }
200*ade49511SJames Wright 
201*ade49511SJames Wright /**
202*ade49511SJames Wright   @brief Unpack stored values at quadrature point
203*ade49511SJames Wright 
204*ade49511SJames Wright   @param[in]   Q         Number of quadrature points
205*ade49511SJames Wright   @param[in]   i         Current quadrature point
206*ade49511SJames Wright   @param[in]   start     Starting index to store components
207*ade49511SJames Wright   @param[in]   num_comp  Number of components to store
208*ade49511SJames Wright   @param[in]   stored    Stored values
209*ade49511SJames Wright   @param[out]  local     Local values for quadrature point i
210*ade49511SJames Wright 
211*ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
212*ade49511SJames Wright **/
213*ade49511SJames Wright CEED_QFUNCTION_HELPER int StoredValuesUnpack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *stored, CeedScalar *local) {
214*ade49511SJames Wright   for (CeedInt j = 0; j < num_comp; j++) local[j] = stored[(start + j) * Q + i];
215*ade49511SJames Wright 
216*ade49511SJames Wright   return CEED_ERROR_SUCCESS;
217*ade49511SJames Wright }
218*ade49511SJames Wright 
219*ade49511SJames Wright /**
220*ade49511SJames Wright   @brief Unpack 3D element q_data at quadrature point
221*ade49511SJames Wright 
222*ade49511SJames Wright   @param[in]   Q         Number of quadrature points
223*ade49511SJames Wright   @param[in]   i         Current quadrature point
224*ade49511SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
225*ade49511SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian
226*ade49511SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [3][3])
227*ade49511SJames Wright 
228*ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
229*ade49511SJames Wright **/
230*ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[3][3]) {
231*ade49511SJames Wright   StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
232*ade49511SJames Wright   StoredValuesUnpack(Q, i, 1, 9, q_data, (CeedScalar *)dXdx);
233*ade49511SJames Wright   return CEED_ERROR_SUCCESS;
234*ade49511SJames Wright }
235*ade49511SJames Wright 
236*ade49511SJames Wright /**
237*ade49511SJames Wright   @brief Unpack boundary element q_data for 3D problem at quadrature point
238*ade49511SJames Wright 
239*ade49511SJames Wright   @param[in]   Q         Number of quadrature points
240*ade49511SJames Wright   @param[in]   i         Current quadrature point
241*ade49511SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
242*ade49511SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
243*ade49511SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][3]), or `NULL`
244*ade49511SJames Wright   @param[out]  normal    Components of the normal vector (shape [3]), or `NULL`
245*ade49511SJames Wright 
246*ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
247*ade49511SJames Wright **/
248*ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][3],
249*ade49511SJames Wright                                                  CeedScalar normal[3]) {
250*ade49511SJames Wright   if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
251*ade49511SJames Wright   if (normal) StoredValuesUnpack(Q, i, 1, 3, q_data, normal);
252*ade49511SJames Wright   if (dXdx) StoredValuesUnpack(Q, i, 4, 6, q_data, (CeedScalar *)dXdx);
253*ade49511SJames Wright   return CEED_ERROR_SUCCESS;
254*ade49511SJames Wright }
255*ade49511SJames Wright 
256704b8bbeSJames Wright #endif  // utils_h
257