113fa47b2SJames Wright // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 213fa47b2SJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 313fa47b2SJames Wright // 413fa47b2SJames Wright // SPDX-License-Identifier: BSD-2-Clause 513fa47b2SJames Wright // 613fa47b2SJames Wright // This file is part of CEED: http://github.com/ceed 713fa47b2SJames Wright 813fa47b2SJames Wright #ifndef utils_h 913fa47b2SJames Wright #define utils_h 1013fa47b2SJames Wright 1113fa47b2SJames Wright #include <ceed.h> 12c9c2c079SJeremy L Thompson #include <math.h> 1313fa47b2SJames Wright 1413fa47b2SJames Wright #ifndef M_PI 1513fa47b2SJames Wright #define M_PI 3.14159265358979323846 1613fa47b2SJames Wright #endif 1713fa47b2SJames Wright 1813fa47b2SJames Wright CEED_QFUNCTION_HELPER CeedScalar Max(CeedScalar a, CeedScalar b) { return a < b ? b : a; } 1913fa47b2SJames Wright CEED_QFUNCTION_HELPER CeedScalar Min(CeedScalar a, CeedScalar b) { return a < b ? a : b; } 2013fa47b2SJames Wright 21dc9b5c4aSJames Wright CEED_QFUNCTION_HELPER void SwapScalar(CeedScalar *a, CeedScalar *b) { 22dc9b5c4aSJames Wright CeedScalar temp = *a; 23dc9b5c4aSJames Wright *a = *b; 24dc9b5c4aSJames Wright *b = temp; 25dc9b5c4aSJames Wright } 26dc9b5c4aSJames Wright 2713fa47b2SJames Wright CEED_QFUNCTION_HELPER CeedScalar Square(CeedScalar x) { return x * x; } 2813fa47b2SJames Wright CEED_QFUNCTION_HELPER CeedScalar Cube(CeedScalar x) { return x * x * x; } 2913fa47b2SJames Wright 30530ad8c4SKenneth E. Jansen // @brief Scale vector of length N by scalar alpha 31530ad8c4SKenneth E. Jansen CEED_QFUNCTION_HELPER void ScaleN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) { 32*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] *= alpha; 33*a455f92dSJames Wright } 34*a455f92dSJames Wright 35*a455f92dSJames Wright // @brief Set vector of length N to a value alpha 36*a455f92dSJames Wright CEED_QFUNCTION_HELPER void SetValueN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) { 37*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] = alpha; 38*a455f92dSJames Wright } 39*a455f92dSJames Wright 40*a455f92dSJames Wright // @brief Copy N elements from x to y 41*a455f92dSJames Wright CEED_QFUNCTION_HELPER void CopyN(const CeedScalar *x, CeedScalar *y, const CeedInt N) { CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) y[i] = x[i]; } 42*a455f92dSJames Wright 43*a455f92dSJames Wright // @brief Copy 3x3 matrix from A to B 44*a455f92dSJames Wright CEED_QFUNCTION_HELPER void CopyMat3(const CeedScalar A[3][3], CeedScalar B[3][3]) { CopyN((const CeedScalar *)A, (CeedScalar *)B, 9); } 45*a455f92dSJames Wright 46*a455f92dSJames Wright // @brief Dot product of vectors with N elements 47*a455f92dSJames Wright CEED_QFUNCTION_HELPER CeedScalar DotN(const CeedScalar *u, const CeedScalar *v, const CeedInt N) { 48*a455f92dSJames Wright CeedScalar output = 0; 49*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) output += u[i] * v[i]; 50*a455f92dSJames Wright return output; 51530ad8c4SKenneth E. Jansen } 52530ad8c4SKenneth E. Jansen 5313fa47b2SJames Wright // @brief Dot product of 3 element vectors 542b730f8bSJeremy L Thompson CEED_QFUNCTION_HELPER CeedScalar Dot3(const CeedScalar u[3], const CeedScalar v[3]) { return u[0] * v[0] + u[1] * v[1] + u[2] * v[2]; } 5513fa47b2SJames Wright 56*a455f92dSJames Wright // @brief Cross product of vectors with 3 elements 57*a455f92dSJames Wright CEED_QFUNCTION_HELPER void Cross3(const CeedScalar u[3], const CeedScalar v[3], CeedScalar w[3]) { 58*a455f92dSJames Wright w[0] = (u[1] * v[2]) - (u[2] * v[1]); 59*a455f92dSJames Wright w[1] = (u[2] * v[0]) - (u[0] * v[2]); 60*a455f92dSJames Wright w[2] = (u[0] * v[1]) - (u[1] * v[0]); 61*a455f92dSJames Wright } 62*a455f92dSJames Wright 63*a455f92dSJames Wright // @brief Curl of vector given its gradient 64*a455f92dSJames Wright CEED_QFUNCTION_HELPER void Curl3(const CeedScalar gradient[3][3], CeedScalar v[3]) { 65*a455f92dSJames Wright v[0] = gradient[2][1] - gradient[1][2]; 66*a455f92dSJames Wright v[1] = gradient[0][2] - gradient[2][0]; 67*a455f92dSJames Wright v[2] = gradient[1][0] - gradient[0][1]; 68*a455f92dSJames Wright } 69*a455f92dSJames Wright 70*a455f92dSJames Wright // @brief Matrix vector product, b = Ax + b. A is NxM, x is M, b is N 71*a455f92dSJames Wright CEED_QFUNCTION_HELPER void MatVecNM(const CeedScalar *A, const CeedScalar *x, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A, 72*a455f92dSJames Wright CeedScalar *b) { 73*a455f92dSJames Wright switch (transpose_A) { 74*a455f92dSJames Wright case CEED_NOTRANSPOSE: 75*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) b[i] += DotN(&A[i * M], x, M); 76*a455f92dSJames Wright break; 77*a455f92dSJames Wright case CEED_TRANSPOSE: 78*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) b[i] += A[j * M + i] * x[j]; } 79*a455f92dSJames Wright break; 80*a455f92dSJames Wright } 81*a455f92dSJames Wright } 82*a455f92dSJames Wright 83*a455f92dSJames Wright // @brief 3x3 Matrix vector product b = Ax + b. 84*a455f92dSJames Wright CEED_QFUNCTION_HELPER void MatVec3(const CeedScalar A[3][3], const CeedScalar x[3], const CeedTransposeMode transpose_A, CeedScalar b[3]) { 85*a455f92dSJames Wright MatVecNM((const CeedScalar *)A, (const CeedScalar *)x, 3, 3, transpose_A, (CeedScalar *)b); 86*a455f92dSJames Wright } 87*a455f92dSJames Wright 88*a455f92dSJames Wright // @brief Matrix-Matrix product, B = DA + B, where D is diagonal. 89*a455f92dSJames Wright // @details A is NxM, D is diagonal NxN, represented by a vector of length N, and B is NxM. Optionally, A may be transposed. 90*a455f92dSJames Wright CEED_QFUNCTION_HELPER void MatDiagNM(const CeedScalar *A, const CeedScalar *D, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A, 91*a455f92dSJames Wright CeedScalar *B) { 92*a455f92dSJames Wright switch (transpose_A) { 93*a455f92dSJames Wright case CEED_NOTRANSPOSE: 94*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < M; j++) B[i * M + j] += D[i] * A[i * M + j]; } 95*a455f92dSJames Wright break; 96*a455f92dSJames Wright case CEED_TRANSPOSE: 97*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) B[i * N + j] += D[i] * A[j * M + i]; } 98*a455f92dSJames Wright break; 99*a455f92dSJames Wright } 100*a455f92dSJames Wright } 101*a455f92dSJames Wright 102*a455f92dSJames Wright // @brief 3x3 Matrix-Matrix product, B = DA + B, where D is diagonal. 103*a455f92dSJames Wright // @details Optionally, A may be transposed. 104*a455f92dSJames Wright CEED_QFUNCTION_HELPER void MatDiag3(const CeedScalar A[3][3], const CeedScalar D[3], const CeedTransposeMode transpose_A, CeedScalar B[3][3]) { 105*a455f92dSJames Wright MatDiagNM((const CeedScalar *)A, (const CeedScalar *)D, 3, 3, transpose_A, (CeedScalar *)B); 106*a455f92dSJames Wright } 107*a455f92dSJames Wright 108*a455f92dSJames Wright // @brief 3x3 Matrix-Matrix product, C = AB + C 109*a455f92dSJames Wright CEED_QFUNCTION_HELPER void MatMat3(const CeedScalar A[3][3], const CeedScalar B[3][3], const CeedTransposeMode transpose_A, 110*a455f92dSJames Wright const CeedTransposeMode transpose_B, CeedScalar C[3][3]) { 111*a455f92dSJames Wright switch (transpose_A) { 112*a455f92dSJames Wright case CEED_NOTRANSPOSE: 113*a455f92dSJames Wright switch (transpose_B) { 114*a455f92dSJames Wright case CEED_NOTRANSPOSE: 115*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) { 116*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[i][k] * B[k][j]; } 117*a455f92dSJames Wright } 118*a455f92dSJames Wright break; 119*a455f92dSJames Wright case CEED_TRANSPOSE: 120*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) { 121*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[i][k] * B[j][k]; } 122*a455f92dSJames Wright } 123*a455f92dSJames Wright break; 124*a455f92dSJames Wright } 125*a455f92dSJames Wright break; 126*a455f92dSJames Wright case CEED_TRANSPOSE: 127*a455f92dSJames Wright switch (transpose_B) { 128*a455f92dSJames Wright case CEED_NOTRANSPOSE: 129*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) { 130*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[k][i] * B[k][j]; } 131*a455f92dSJames Wright } 132*a455f92dSJames Wright break; 133*a455f92dSJames Wright case CEED_TRANSPOSE: 134*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < 3; i++) { 135*a455f92dSJames Wright CeedPragmaSIMD for (CeedInt j = 0; j < 3; j++) { CeedPragmaSIMD for (CeedInt k = 0; k < 3; k++) C[i][j] += A[k][i] * B[j][k]; } 136*a455f92dSJames Wright } 137*a455f92dSJames Wright break; 138*a455f92dSJames Wright } 139*a455f92dSJames Wright break; 140*a455f92dSJames Wright } 141*a455f92dSJames Wright } 142*a455f92dSJames Wright 14313fa47b2SJames Wright // @brief Unpack Kelvin-Mandel notation symmetric tensor into full tensor 14413fa47b2SJames Wright CEED_QFUNCTION_HELPER void KMUnpack(const CeedScalar v[6], CeedScalar A[3][3]) { 14513fa47b2SJames Wright const CeedScalar weight = 1 / sqrt(2.); 14613fa47b2SJames Wright A[0][0] = v[0]; 14713fa47b2SJames Wright A[1][1] = v[1]; 14813fa47b2SJames Wright A[2][2] = v[2]; 14913fa47b2SJames Wright A[2][1] = A[1][2] = weight * v[3]; 15013fa47b2SJames Wright A[2][0] = A[0][2] = weight * v[4]; 15113fa47b2SJames Wright A[1][0] = A[0][1] = weight * v[5]; 15213fa47b2SJames Wright } 15313fa47b2SJames Wright 154*a455f92dSJames Wright // @brief Pack full tensor into Kelvin-Mandel notation symmetric tensor 155*a455f92dSJames Wright CEED_QFUNCTION_HELPER void KMPack(const CeedScalar A[3][3], CeedScalar v[6]) { 156*a455f92dSJames Wright const CeedScalar weight = sqrt(2.); 157*a455f92dSJames Wright v[0] = A[0][0]; 158*a455f92dSJames Wright v[1] = A[1][1]; 159*a455f92dSJames Wright v[2] = A[2][2]; 160*a455f92dSJames Wright v[3] = A[2][1] * weight; 161*a455f92dSJames Wright v[4] = A[2][0] * weight; 162*a455f92dSJames Wright v[5] = A[1][0] * weight; 163*a455f92dSJames Wright } 164*a455f92dSJames Wright 165*a455f92dSJames Wright // @brief Calculate metric tensor from mapping, g_{ij} = xi_{k,i} xi_{k,j} = dXdx^T dXdx 166*a455f92dSJames Wright CEED_QFUNCTION_HELPER void KMMetricTensor(const CeedScalar dXdx[3][3], CeedScalar km_g_ij[6]) { 167*a455f92dSJames Wright CeedScalar g_ij[3][3] = {{0.}}; 168*a455f92dSJames Wright MatMat3(dXdx, dXdx, CEED_TRANSPOSE, CEED_NOTRANSPOSE, g_ij); 169*a455f92dSJames Wright KMPack(g_ij, km_g_ij); 170*a455f92dSJames Wright } 171*a455f92dSJames Wright 172530ad8c4SKenneth E. Jansen // @brief Linear ramp evaluation 173530ad8c4SKenneth E. Jansen CEED_QFUNCTION_HELPER CeedScalar LinearRampCoefficient(CeedScalar amplitude, CeedScalar length, CeedScalar start, CeedScalar x) { 174530ad8c4SKenneth E. Jansen if (x < start) { 175530ad8c4SKenneth E. Jansen return amplitude; 176530ad8c4SKenneth E. Jansen } else if (x < start + length) { 177530ad8c4SKenneth E. Jansen return amplitude * ((x - start) * (-1 / length) + 1); 178530ad8c4SKenneth E. Jansen } else { 179530ad8c4SKenneth E. Jansen return 0; 180530ad8c4SKenneth E. Jansen } 181530ad8c4SKenneth E. Jansen } 182530ad8c4SKenneth E. Jansen 18313fa47b2SJames Wright #endif // utils_h 184