1dc936754SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors. 2704b8bbeSJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3704b8bbeSJames Wright // 4704b8bbeSJames Wright // SPDX-License-Identifier: BSD-2-Clause 5704b8bbeSJames Wright // 6704b8bbeSJames Wright // This file is part of CEED: http://github.com/ceed 7*c7ece6efSJeremy L Thompson #pragma once 8704b8bbeSJames Wright 9704b8bbeSJames Wright #include <ceed.h> 10d0cce58aSJeremy L Thompson #include <math.h> 11704b8bbeSJames Wright 12704b8bbeSJames Wright #ifndef M_PI 13704b8bbeSJames Wright #define M_PI 3.14159265358979323846 14704b8bbeSJames Wright #endif 15704b8bbeSJames Wright 16704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Max(CeedScalar a, CeedScalar b) { return a < b ? b : a; } 17704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Min(CeedScalar a, CeedScalar b) { return a < b ? a : b; } 18704b8bbeSJames Wright 19bfa7851aSJames Wright CEED_QFUNCTION_HELPER void SwapScalar(CeedScalar *a, CeedScalar *b) { 20bfa7851aSJames Wright CeedScalar temp = *a; 21bfa7851aSJames Wright *a = *b; 22bfa7851aSJames Wright *b = temp; 23bfa7851aSJames Wright } 24bfa7851aSJames Wright 25704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Square(CeedScalar x) { return x * x; } 26704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Cube(CeedScalar x) { return x * x * x; } 27704b8bbeSJames Wright 28e7754af5SKenneth E. Jansen // @brief Scale vector of length N by scalar alpha 29e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER void ScaleN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) { 308e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] *= alpha; 318e5e3595SJames Wright } 328e5e3595SJames Wright 338e5e3595SJames Wright // @brief Set vector of length N to a value alpha 348e5e3595SJames Wright CEED_QFUNCTION_HELPER void SetValueN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) { 358e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] = alpha; 368e5e3595SJames Wright } 378e5e3595SJames Wright 388e5e3595SJames Wright // @brief Copy N elements from x to y 398e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyN(const CeedScalar *x, CeedScalar *y, const CeedInt N) { CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) y[i] = x[i]; } 408e5e3595SJames Wright 418e5e3595SJames Wright // @brief Copy 3x3 matrix from A to B 428e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyMat3(const CeedScalar A[3][3], CeedScalar B[3][3]) { CopyN((const CeedScalar *)A, (CeedScalar *)B, 9); } 438e5e3595SJames Wright 448e5e3595SJames Wright // @brief Dot product of vectors with N elements 458e5e3595SJames Wright CEED_QFUNCTION_HELPER CeedScalar DotN(const CeedScalar *u, const CeedScalar *v, const CeedInt N) { 468e5e3595SJames Wright CeedScalar output = 0; 478e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) output += u[i] * v[i]; 488e5e3595SJames Wright return output; 49e7754af5SKenneth E. Jansen } 50e7754af5SKenneth E. Jansen 51704b8bbeSJames Wright // @brief Dot product of 3 element vectors 528fff8293SJames Wright CEED_QFUNCTION_HELPER CeedScalar Dot3(const CeedScalar *u, const CeedScalar *v) { return u[0] * v[0] + u[1] * v[1] + u[2] * v[2]; } 53704b8bbeSJames Wright 548e5e3595SJames Wright // @brief Cross product of vectors with 3 elements 558e5e3595SJames Wright CEED_QFUNCTION_HELPER void Cross3(const CeedScalar u[3], const CeedScalar v[3], CeedScalar w[3]) { 568e5e3595SJames Wright w[0] = (u[1] * v[2]) - (u[2] * v[1]); 578e5e3595SJames Wright w[1] = (u[2] * v[0]) - (u[0] * v[2]); 588e5e3595SJames Wright w[2] = (u[0] * v[1]) - (u[1] * v[0]); 598e5e3595SJames Wright } 608e5e3595SJames Wright 618e5e3595SJames Wright // @brief Curl of vector given its gradient 628e5e3595SJames Wright CEED_QFUNCTION_HELPER void Curl3(const CeedScalar gradient[3][3], CeedScalar v[3]) { 638e5e3595SJames Wright v[0] = gradient[2][1] - gradient[1][2]; 648e5e3595SJames Wright v[1] = gradient[0][2] - gradient[2][0]; 658e5e3595SJames Wright v[2] = gradient[1][0] - gradient[0][1]; 668e5e3595SJames Wright } 678e5e3595SJames Wright 688e5e3595SJames Wright // @brief Matrix vector product, b = Ax + b. A is NxM, x is M, b is N 698e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVecNM(const CeedScalar *A, const CeedScalar *x, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A, 708e5e3595SJames Wright CeedScalar *b) { 718e5e3595SJames Wright switch (transpose_A) { 728e5e3595SJames Wright case CEED_NOTRANSPOSE: 738e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) b[i] += DotN(&A[i * M], x, M); 748e5e3595SJames Wright break; 758e5e3595SJames Wright case CEED_TRANSPOSE: 768e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) b[i] += A[j * M + i] * x[j]; } 778e5e3595SJames Wright break; 788e5e3595SJames Wright } 798e5e3595SJames Wright } 808e5e3595SJames Wright 818e5e3595SJames Wright // @brief 3x3 Matrix vector product b = Ax + b. 828e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVec3(const CeedScalar A[3][3], const CeedScalar x[3], const CeedTransposeMode transpose_A, CeedScalar b[3]) { 838e5e3595SJames Wright MatVecNM((const CeedScalar *)A, (const CeedScalar *)x, 3, 3, transpose_A, (CeedScalar *)b); 848e5e3595SJames Wright } 858e5e3595SJames Wright 868e5e3595SJames Wright // @brief Matrix-Matrix product, B = DA + B, where D is diagonal. 878e5e3595SJames Wright // @details A is NxM, D is diagonal NxN, represented by a vector of length N, and B is NxM. Optionally, A may be transposed. 888e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiagNM(const CeedScalar *A, const CeedScalar *D, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A, 898e5e3595SJames Wright CeedScalar *B) { 908e5e3595SJames Wright switch (transpose_A) { 918e5e3595SJames Wright case CEED_NOTRANSPOSE: 928e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < M; j++) B[i * M + j] += D[i] * A[i * M + j]; } 938e5e3595SJames Wright break; 948e5e3595SJames Wright case CEED_TRANSPOSE: 958e5e3595SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) B[i * N + j] += D[i] * A[j * M + i]; } 968e5e3595SJames Wright break; 978e5e3595SJames Wright } 988e5e3595SJames Wright } 998e5e3595SJames Wright 1008e5e3595SJames Wright // @brief 3x3 Matrix-Matrix product, B = DA + B, where D is diagonal. 1018e5e3595SJames Wright // @details Optionally, A may be transposed. 1028e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiag3(const CeedScalar A[3][3], const CeedScalar D[3], const CeedTransposeMode transpose_A, CeedScalar B[3][3]) { 1038e5e3595SJames Wright MatDiagNM((const CeedScalar *)A, (const CeedScalar *)D, 3, 3, transpose_A, (CeedScalar *)B); 1048e5e3595SJames Wright } 105e975cfccSJames Wright // @brief NxN Matrix-Matrix product, C = AB + C 106e975cfccSJames Wright CEED_QFUNCTION_HELPER void MatMatN(const CeedScalar *A, const CeedScalar *B, const CeedInt N, const CeedTransposeMode transpose_A, 107e975cfccSJames Wright const CeedTransposeMode transpose_B, CeedScalar *C) { 1088e5e3595SJames Wright switch (transpose_A) { 1098e5e3595SJames Wright case CEED_NOTRANSPOSE: 1108e5e3595SJames Wright switch (transpose_B) { 1118e5e3595SJames Wright case CEED_NOTRANSPOSE: 112e975cfccSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { 113e975cfccSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) { 114e975cfccSJames Wright CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[i * N + k] * B[k * N + j]; 115e975cfccSJames Wright } 1168e5e3595SJames Wright } 1178e5e3595SJames Wright break; 1188e5e3595SJames Wright case CEED_TRANSPOSE: 119e975cfccSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { 120e975cfccSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) { 121e975cfccSJames Wright CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[i * N + k] * B[j * N + k]; 122e975cfccSJames Wright } 1238e5e3595SJames Wright } 1248e5e3595SJames Wright break; 1258e5e3595SJames Wright } 1268e5e3595SJames Wright break; 1278e5e3595SJames Wright case CEED_TRANSPOSE: 1288e5e3595SJames Wright switch (transpose_B) { 1298e5e3595SJames Wright case CEED_NOTRANSPOSE: 130e975cfccSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { 131e975cfccSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) { 132e975cfccSJames Wright CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[k * N + i] * B[k * N + j]; 133e975cfccSJames Wright } 1348e5e3595SJames Wright } 1358e5e3595SJames Wright break; 1368e5e3595SJames Wright case CEED_TRANSPOSE: 137e975cfccSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { 138e975cfccSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) { 139e975cfccSJames Wright CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[k * N + i] * B[j * N + k]; 140e975cfccSJames Wright } 1418e5e3595SJames Wright } 1428e5e3595SJames Wright break; 1438e5e3595SJames Wright } 1448e5e3595SJames Wright break; 1458e5e3595SJames Wright } 1468e5e3595SJames Wright } 1478e5e3595SJames Wright 148e975cfccSJames Wright // @brief 3x3 Matrix-Matrix product, C = AB + C 149e975cfccSJames Wright CEED_QFUNCTION_HELPER void MatMat3(const CeedScalar A[3][3], const CeedScalar B[3][3], const CeedTransposeMode transpose_A, 150e975cfccSJames Wright const CeedTransposeMode transpose_B, CeedScalar C[3][3]) { 151e975cfccSJames Wright MatMatN((const CeedScalar *)A, (const CeedScalar *)B, 3, transpose_A, transpose_B, (CeedScalar *)C); 152e975cfccSJames Wright } 153e975cfccSJames Wright 154704b8bbeSJames Wright // @brief Unpack Kelvin-Mandel notation symmetric tensor into full tensor 155704b8bbeSJames Wright CEED_QFUNCTION_HELPER void KMUnpack(const CeedScalar v[6], CeedScalar A[3][3]) { 156704b8bbeSJames Wright const CeedScalar weight = 1 / sqrt(2.); 157704b8bbeSJames Wright A[0][0] = v[0]; 158704b8bbeSJames Wright A[1][1] = v[1]; 159704b8bbeSJames Wright A[2][2] = v[2]; 160704b8bbeSJames Wright A[2][1] = A[1][2] = weight * v[3]; 161704b8bbeSJames Wright A[2][0] = A[0][2] = weight * v[4]; 162704b8bbeSJames Wright A[1][0] = A[0][1] = weight * v[5]; 163704b8bbeSJames Wright } 164704b8bbeSJames Wright 1658e5e3595SJames Wright // @brief Pack full tensor into Kelvin-Mandel notation symmetric tensor 1668e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMPack(const CeedScalar A[3][3], CeedScalar v[6]) { 1678e5e3595SJames Wright const CeedScalar weight = sqrt(2.); 1688e5e3595SJames Wright v[0] = A[0][0]; 1698e5e3595SJames Wright v[1] = A[1][1]; 1708e5e3595SJames Wright v[2] = A[2][2]; 1718e5e3595SJames Wright v[3] = A[2][1] * weight; 1728e5e3595SJames Wright v[4] = A[2][0] * weight; 1738e5e3595SJames Wright v[5] = A[1][0] * weight; 1748e5e3595SJames Wright } 1758e5e3595SJames Wright 1768e5e3595SJames Wright // @brief Calculate metric tensor from mapping, g_{ij} = xi_{k,i} xi_{k,j} = dXdx^T dXdx 1778e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMMetricTensor(const CeedScalar dXdx[3][3], CeedScalar km_g_ij[6]) { 1788e5e3595SJames Wright CeedScalar g_ij[3][3] = {{0.}}; 1798e5e3595SJames Wright MatMat3(dXdx, dXdx, CEED_TRANSPOSE, CEED_NOTRANSPOSE, g_ij); 1808e5e3595SJames Wright KMPack(g_ij, km_g_ij); 1818e5e3595SJames Wright } 1828e5e3595SJames Wright 183e7754af5SKenneth E. Jansen // @brief Linear ramp evaluation 184e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER CeedScalar LinearRampCoefficient(CeedScalar amplitude, CeedScalar length, CeedScalar start, CeedScalar x) { 185e7754af5SKenneth E. Jansen if (x < start) { 186e7754af5SKenneth E. Jansen return amplitude; 187e7754af5SKenneth E. Jansen } else if (x < start + length) { 188e7754af5SKenneth E. Jansen return amplitude * ((x - start) * (-1 / length) + 1); 189e7754af5SKenneth E. Jansen } else { 190e7754af5SKenneth E. Jansen return 0; 191e7754af5SKenneth E. Jansen } 192e7754af5SKenneth E. Jansen } 193e7754af5SKenneth E. Jansen 194ade49511SJames Wright /** 195ade49511SJames Wright @brief Pack stored values at quadrature point 196ade49511SJames Wright 197ade49511SJames Wright @param[in] Q Number of quadrature points 198ade49511SJames Wright @param[in] i Current quadrature point 199ade49511SJames Wright @param[in] start Starting index to store components 200ade49511SJames Wright @param[in] num_comp Number of components to store 2016764667bSJames Wright @param[in] values_at_qpnt Local values for quadrature point i 202ade49511SJames Wright @param[out] stored Stored values 203ade49511SJames Wright 204ade49511SJames Wright @return An error code: 0 - success, otherwise - failure 205ade49511SJames Wright **/ 2066764667bSJames Wright CEED_QFUNCTION_HELPER int StoredValuesPack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *values_at_qpnt, 2076764667bSJames Wright CeedScalar *stored) { 2086764667bSJames Wright for (CeedInt j = 0; j < num_comp; j++) stored[(start + j) * Q + i] = values_at_qpnt[j]; 209ade49511SJames Wright 210ade49511SJames Wright return CEED_ERROR_SUCCESS; 211ade49511SJames Wright } 212ade49511SJames Wright 213ade49511SJames Wright /** 214ade49511SJames Wright @brief Unpack stored values at quadrature point 215ade49511SJames Wright 216ade49511SJames Wright @param[in] Q Number of quadrature points 217ade49511SJames Wright @param[in] i Current quadrature point 218ade49511SJames Wright @param[in] start Starting index to store components 219ade49511SJames Wright @param[in] num_comp Number of components to store 220ade49511SJames Wright @param[in] stored Stored values 2216764667bSJames Wright @param[out] values_at_qpnt Local values for quadrature point i 222ade49511SJames Wright 223ade49511SJames Wright @return An error code: 0 - success, otherwise - failure 224ade49511SJames Wright **/ 2256764667bSJames Wright CEED_QFUNCTION_HELPER int StoredValuesUnpack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *stored, 2266764667bSJames Wright CeedScalar *values_at_qpnt) { 2276764667bSJames Wright for (CeedInt j = 0; j < num_comp; j++) values_at_qpnt[j] = stored[(start + j) * Q + i]; 228ade49511SJames Wright 229ade49511SJames Wright return CEED_ERROR_SUCCESS; 230ade49511SJames Wright } 231ade49511SJames Wright 232ade49511SJames Wright /** 233ade49511SJames Wright @brief Unpack 3D element q_data at quadrature point 234ade49511SJames Wright 235ade49511SJames Wright @param[in] Q Number of quadrature points 236ade49511SJames Wright @param[in] i Current quadrature point 237ade49511SJames Wright @param[in] q_data Pointer to q_data (generated by `setupgeo.h:Setup`) 238ade49511SJames Wright @param[out] wdetJ Quadrature weight times determinant of the mapping Jacobian 239ade49511SJames Wright @param[out] dXdx Inverse of the mapping Jacobian (shape [3][3]) 240ade49511SJames Wright 241ade49511SJames Wright @return An error code: 0 - success, otherwise - failure 242ade49511SJames Wright **/ 243ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[3][3]) { 244ade49511SJames Wright StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ); 245ade49511SJames Wright StoredValuesUnpack(Q, i, 1, 9, q_data, (CeedScalar *)dXdx); 246ade49511SJames Wright return CEED_ERROR_SUCCESS; 247ade49511SJames Wright } 248ade49511SJames Wright 249ade49511SJames Wright /** 250ade49511SJames Wright @brief Unpack boundary element q_data for 3D problem at quadrature point 251ade49511SJames Wright 252ade49511SJames Wright @param[in] Q Number of quadrature points 253ade49511SJames Wright @param[in] i Current quadrature point 2542c512a7bSJames Wright @param[in] q_data Pointer to q_data (generated by `setupgeo.h:SetupBoundary`) 255ade49511SJames Wright @param[out] wdetJ Quadrature weight times determinant of the mapping Jacobian, or `NULL` 256ade49511SJames Wright @param[out] dXdx Inverse of the mapping Jacobian (shape [2][3]), or `NULL` 257ade49511SJames Wright @param[out] normal Components of the normal vector (shape [3]), or `NULL` 258ade49511SJames Wright 259ade49511SJames Wright @return An error code: 0 - success, otherwise - failure 260ade49511SJames Wright **/ 261ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][3], 262ade49511SJames Wright CeedScalar normal[3]) { 263ade49511SJames Wright if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ); 264ade49511SJames Wright if (normal) StoredValuesUnpack(Q, i, 1, 3, q_data, normal); 265ade49511SJames Wright if (dXdx) StoredValuesUnpack(Q, i, 4, 6, q_data, (CeedScalar *)dXdx); 266ade49511SJames Wright return CEED_ERROR_SUCCESS; 267ade49511SJames Wright } 268ade49511SJames Wright 269baadde1fSJames Wright /** 270baadde1fSJames Wright @brief Unpack 2D element q_data at quadrature point 271baadde1fSJames Wright 272baadde1fSJames Wright @param[in] Q Number of quadrature points 273baadde1fSJames Wright @param[in] i Current quadrature point 274baadde1fSJames Wright @param[in] q_data Pointer to q_data (generated by `setupgeo.h:Setup`) 275baadde1fSJames Wright @param[out] wdetJ Quadrature weight times determinant of the mapping Jacobian 276baadde1fSJames Wright @param[out] dXdx Inverse of the mapping Jacobian (shape [2][2]) 277baadde1fSJames Wright 278baadde1fSJames Wright @return An error code: 0 - success, otherwise - failure 279baadde1fSJames Wright **/ 280baadde1fSJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][2]) { 281baadde1fSJames Wright StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ); 282baadde1fSJames Wright StoredValuesUnpack(Q, i, 1, 4, q_data, (CeedScalar *)dXdx); 283baadde1fSJames Wright return CEED_ERROR_SUCCESS; 284baadde1fSJames Wright } 285baadde1fSJames Wright 2862c512a7bSJames Wright /** 2872c512a7bSJames Wright @brief Unpack boundary element q_data for 2D problem at quadrature point 2882c512a7bSJames Wright 2892c512a7bSJames Wright @param[in] Q Number of quadrature points 2902c512a7bSJames Wright @param[in] i Current quadrature point 2912c512a7bSJames Wright @param[in] q_data Pointer to q_data (generated by `setupgeo.h:SetupBoundary2d`) 2922c512a7bSJames Wright @param[out] wdetJ Quadrature weight times determinant of the mapping Jacobian, or `NULL` 2932c512a7bSJames Wright @param[out] normal Components of the normal vector (shape [2]), or `NULL` 2942c512a7bSJames Wright 2952c512a7bSJames Wright @return An error code: 0 - success, otherwise - failure 2962c512a7bSJames Wright **/ 2972c512a7bSJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar normal[2]) { 2982c512a7bSJames Wright if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ); 2992c512a7bSJames Wright if (normal) StoredValuesUnpack(Q, i, 1, 2, q_data, normal); 3002c512a7bSJames Wright return CEED_ERROR_SUCCESS; 3012c512a7bSJames Wright } 302