115ed3f7dSjeremylt /// @file 215ed3f7dSjeremylt /// Test creation and use of FDM element inverse 315ed3f7dSjeremylt /// \test Test creation and use of FDM element inverse 42b730f8bSJeremy L Thompson #include "t541-operator.h" 52b730f8bSJeremy L Thompson 615ed3f7dSjeremylt #include <ceed.h> 72b730f8bSJeremy L Thompson #include <math.h> 849aac155SJeremy L Thompson #include <stdio.h> 915ed3f7dSjeremylt #include <stdlib.h> 1015ed3f7dSjeremylt #include <string.h> 1115ed3f7dSjeremylt 1215ed3f7dSjeremylt int main(int argc, char **argv) { 1315ed3f7dSjeremylt Ceed ceed; 144fee36f0SJeremy L Thompson CeedElemRestriction elem_restriction_x, elem_restriction_u, elem_restriction_q_data; 1515ed3f7dSjeremylt CeedBasis basis_x, basis_u; 1615ed3f7dSjeremylt CeedQFunction qf_setup_diff, qf_apply; 174fee36f0SJeremy L Thompson CeedOperator op_setup_diff, op_apply, op_inverse; 184fee36f0SJeremy L Thompson CeedVector q_data_diff, x, u, v, w; 194fee36f0SJeremy L Thompson CeedInt num_elem = 1, p = 4, q = 5, dim = 2; 204fee36f0SJeremy L Thompson CeedInt num_dofs = p * p, num_qpts = num_elem * q * q, q_data_size = dim * (dim + 1) / 2; 2115ed3f7dSjeremylt 2215ed3f7dSjeremylt CeedInit(argv[1], &ceed); 2315ed3f7dSjeremylt 2480a9ef05SNatalie Beams // Test skipped if using single precision 252b730f8bSJeremy L Thompson if (CEED_SCALAR_TYPE == CEED_SCALAR_FP32) return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Test not implemented in single precision"); 2680a9ef05SNatalie Beams 274fee36f0SJeremy L Thompson // Vectors 284fee36f0SJeremy L Thompson CeedVectorCreate(ceed, dim * num_elem * (2 * 2), &x); 294fee36f0SJeremy L Thompson { 304fee36f0SJeremy L Thompson CeedScalar x_array[dim * num_elem * (2 * 2)]; 314fee36f0SJeremy L Thompson 322b730f8bSJeremy L Thompson for (CeedInt i = 0; i < 2; i++) { 3315ed3f7dSjeremylt for (CeedInt j = 0; j < 2; j++) { 344fee36f0SJeremy L Thompson x_array[i + j * 2 + 0 * 4] = i; 354fee36f0SJeremy L Thompson x_array[i + j * 2 + 1 * 4] = j; 3615ed3f7dSjeremylt } 372b730f8bSJeremy L Thompson } 384fee36f0SJeremy L Thompson CeedVectorSetArray(x, CEED_MEM_HOST, CEED_COPY_VALUES, x_array); 394fee36f0SJeremy L Thompson } 404fee36f0SJeremy L Thompson CeedVectorCreate(ceed, num_dofs, &u); 414fee36f0SJeremy L Thompson CeedVectorCreate(ceed, num_dofs, &v); 424fee36f0SJeremy L Thompson CeedVectorCreate(ceed, num_dofs, &w); 4315ed3f7dSjeremylt CeedVectorCreate(ceed, q_data_size * num_qpts, &q_data_diff); 4415ed3f7dSjeremylt 4515ed3f7dSjeremylt // Restrictions 4615ed3f7dSjeremylt CeedInt strides_x[3] = {1, 2 * 2, 2 * 2 * dim}; 474fee36f0SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, 2 * 2, dim, dim * num_elem * 2 * 2, strides_x, &elem_restriction_x); 4815ed3f7dSjeremylt 494fee36f0SJeremy L Thompson CeedInt strides_u[3] = {1, p * p, p * p}; 504fee36f0SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, p * p, 1, num_dofs, strides_u, &elem_restriction_u); 5115ed3f7dSjeremylt 524fee36f0SJeremy L Thompson CeedInt strides_q_data[3] = {1, q * q, q_data_size * q * q}; 534fee36f0SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, q * q, q_data_size, num_qpts * q_data_size, strides_q_data, &elem_restriction_q_data); 5415ed3f7dSjeremylt 5515ed3f7dSjeremylt // Bases 564fee36f0SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, 2, q, CEED_GAUSS, &basis_x); 574fee36f0SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, p, q, CEED_GAUSS, &basis_u); 5815ed3f7dSjeremylt 5915ed3f7dSjeremylt // QFunction - setup diff 602b730f8bSJeremy L Thompson CeedQFunctionCreateInterior(ceed, 1, setup_diff, setup_diff_loc, &qf_setup_diff); 6115ed3f7dSjeremylt CeedQFunctionAddInput(qf_setup_diff, "dx", dim * dim, CEED_EVAL_GRAD); 6215ed3f7dSjeremylt CeedQFunctionAddInput(qf_setup_diff, "weight", 1, CEED_EVAL_WEIGHT); 6315ed3f7dSjeremylt CeedQFunctionAddOutput(qf_setup_diff, "q data", q_data_size, CEED_EVAL_NONE); 6415ed3f7dSjeremylt 6515ed3f7dSjeremylt // Operator - setup diff 662b730f8bSJeremy L Thompson CeedOperatorCreate(ceed, qf_setup_diff, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_setup_diff); 674fee36f0SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "dx", elem_restriction_x, basis_x, CEED_VECTOR_ACTIVE); 682b730f8bSJeremy L Thompson CeedOperatorSetField(op_setup_diff, "weight", CEED_ELEMRESTRICTION_NONE, basis_x, CEED_VECTOR_NONE); 69*356036faSJeremy L Thompson CeedOperatorSetField(op_setup_diff, "q data", elem_restriction_q_data, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE); 7015ed3f7dSjeremylt 7115ed3f7dSjeremylt // Apply Setup Operator 724fee36f0SJeremy L Thompson CeedOperatorApply(op_setup_diff, x, q_data_diff, CEED_REQUEST_IMMEDIATE); 7315ed3f7dSjeremylt 7415ed3f7dSjeremylt // QFunction - apply 7515ed3f7dSjeremylt CeedQFunctionCreateInterior(ceed, 1, apply, apply_loc, &qf_apply); 7615ed3f7dSjeremylt CeedQFunctionAddInput(qf_apply, "u", dim, CEED_EVAL_GRAD); 774fee36f0SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "q data diff", q_data_size, CEED_EVAL_NONE); 7815ed3f7dSjeremylt CeedQFunctionAddOutput(qf_apply, "v", dim, CEED_EVAL_GRAD); 7915ed3f7dSjeremylt 8015ed3f7dSjeremylt // Operator - apply 812b730f8bSJeremy L Thompson CeedOperatorCreate(ceed, qf_apply, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_apply); 824fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "u", elem_restriction_u, basis_u, CEED_VECTOR_ACTIVE); 83*356036faSJeremy L Thompson CeedOperatorSetField(op_apply, "q data diff", elem_restriction_q_data, CEED_BASIS_NONE, q_data_diff); 844fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "v", elem_restriction_u, basis_u, CEED_VECTOR_ACTIVE); 8515ed3f7dSjeremylt 8615ed3f7dSjeremylt // Create FDM element inverse 874fee36f0SJeremy L Thompson CeedOperatorCreateFDMElementInverse(op_apply, &op_inverse, CEED_REQUEST_IMMEDIATE); 8815ed3f7dSjeremylt 8915ed3f7dSjeremylt // Create Schur complement for element corners 9015ed3f7dSjeremylt CeedScalar S[16]; 9115ed3f7dSjeremylt for (CeedInt i = 0; i < 4; i++) { 924fee36f0SJeremy L Thompson CeedScalar *u_array; 934fee36f0SJeremy L Thompson 944fee36f0SJeremy L Thompson CeedVectorSetValue(u, 0.0); 954fee36f0SJeremy L Thompson CeedVectorGetArray(u, CEED_MEM_HOST, &u_array); 9615ed3f7dSjeremylt switch (i) { 972b730f8bSJeremy L Thompson case 0: 984fee36f0SJeremy L Thompson u_array[0] = 1.0; 992b730f8bSJeremy L Thompson break; 1002b730f8bSJeremy L Thompson case 1: 1014fee36f0SJeremy L Thompson u_array[p - 1] = 1.0; 1022b730f8bSJeremy L Thompson break; 1032b730f8bSJeremy L Thompson case 2: 1044fee36f0SJeremy L Thompson u_array[p * p - p] = 1.0; 1052b730f8bSJeremy L Thompson break; 1062b730f8bSJeremy L Thompson case 3: 1074fee36f0SJeremy L Thompson u_array[p * p - 1] = 1.0; 1082b730f8bSJeremy L Thompson break; 10915ed3f7dSjeremylt } 1104fee36f0SJeremy L Thompson CeedVectorRestoreArray(u, &u_array); 11115ed3f7dSjeremylt 1124fee36f0SJeremy L Thompson CeedOperatorApply(op_inverse, u, v, CEED_REQUEST_IMMEDIATE); 11315ed3f7dSjeremylt 1144fee36f0SJeremy L Thompson const CeedScalar *v_array; 1154fee36f0SJeremy L Thompson 1164fee36f0SJeremy L Thompson CeedVectorGetArrayRead(v, CEED_MEM_HOST, &v_array); 1174fee36f0SJeremy L Thompson S[0 * 4 + i] = -v_array[0]; 1184fee36f0SJeremy L Thompson S[1 * 4 + i] = -v_array[p - 1]; 1194fee36f0SJeremy L Thompson S[2 * 4 + i] = -v_array[p * p - p]; 1204fee36f0SJeremy L Thompson S[3 * 4 + i] = -v_array[p * p - 1]; 1214fee36f0SJeremy L Thompson CeedVectorRestoreArrayRead(v, &v_array); 12215ed3f7dSjeremylt } 12315ed3f7dSjeremylt CeedScalar S_inv[16]; 12415ed3f7dSjeremylt { 12515ed3f7dSjeremylt CeedScalar det; 1262b730f8bSJeremy L Thompson S_inv[0] = S[5] * S[10] * S[15] - S[5] * S[11] * S[14] - S[9] * S[6] * S[15] + S[9] * S[7] * S[14] + S[13] * S[6] * S[11] - S[13] * S[7] * S[10]; 12715ed3f7dSjeremylt 1282b730f8bSJeremy L Thompson S_inv[4] = -S[4] * S[10] * S[15] + S[4] * S[11] * S[14] + S[8] * S[6] * S[15] - S[8] * S[7] * S[14] - S[12] * S[6] * S[11] + S[12] * S[7] * S[10]; 12915ed3f7dSjeremylt 1302b730f8bSJeremy L Thompson S_inv[8] = S[4] * S[9] * S[15] - S[4] * S[11] * S[13] - S[8] * S[5] * S[15] + S[8] * S[7] * S[13] + S[12] * S[5] * S[11] - S[12] * S[7] * S[9]; 13115ed3f7dSjeremylt 1322b730f8bSJeremy L Thompson S_inv[12] = -S[4] * S[9] * S[14] + S[4] * S[10] * S[13] + S[8] * S[5] * S[14] - S[8] * S[6] * S[13] - S[12] * S[5] * S[10] + S[12] * S[6] * S[9]; 13315ed3f7dSjeremylt 1342b730f8bSJeremy L Thompson S_inv[1] = -S[1] * S[10] * S[15] + S[1] * S[11] * S[14] + S[9] * S[2] * S[15] - S[9] * S[3] * S[14] - S[13] * S[2] * S[11] + S[13] * S[3] * S[10]; 13515ed3f7dSjeremylt 1362b730f8bSJeremy L Thompson S_inv[5] = S[0] * S[10] * S[15] - S[0] * S[11] * S[14] - S[8] * S[2] * S[15] + S[8] * S[3] * S[14] + S[12] * S[2] * S[11] - S[12] * S[3] * S[10]; 13715ed3f7dSjeremylt 1382b730f8bSJeremy L Thompson S_inv[9] = -S[0] * S[9] * S[15] + S[0] * S[11] * S[13] + S[8] * S[1] * S[15] - S[8] * S[3] * S[13] - S[12] * S[1] * S[11] + S[12] * S[3] * S[9]; 13915ed3f7dSjeremylt 1402b730f8bSJeremy L Thompson S_inv[13] = S[0] * S[9] * S[14] - S[0] * S[10] * S[13] - S[8] * S[1] * S[14] + S[8] * S[2] * S[13] + S[12] * S[1] * S[10] - S[12] * S[2] * S[9]; 14115ed3f7dSjeremylt 1422b730f8bSJeremy L Thompson S_inv[2] = S[1] * S[6] * S[15] - S[1] * S[7] * S[14] - S[5] * S[2] * S[15] + S[5] * S[3] * S[14] + S[13] * S[2] * S[7] - S[13] * S[3] * S[6]; 14315ed3f7dSjeremylt 1442b730f8bSJeremy L Thompson S_inv[6] = -S[0] * S[6] * S[15] + S[0] * S[7] * S[14] + S[4] * S[2] * S[15] - S[4] * S[3] * S[14] - S[12] * S[2] * S[7] + S[12] * S[3] * S[6]; 14515ed3f7dSjeremylt 1462b730f8bSJeremy L Thompson S_inv[10] = S[0] * S[5] * S[15] - S[0] * S[7] * S[13] - S[4] * S[1] * S[15] + S[4] * S[3] * S[13] + S[12] * S[1] * S[7] - S[12] * S[3] * S[5]; 14715ed3f7dSjeremylt 1482b730f8bSJeremy L Thompson S_inv[14] = -S[0] * S[5] * S[14] + S[0] * S[6] * S[13] + S[4] * S[1] * S[14] - S[4] * S[2] * S[13] - S[12] * S[1] * S[6] + S[12] * S[2] * S[5]; 14915ed3f7dSjeremylt 1502b730f8bSJeremy L Thompson S_inv[3] = -S[1] * S[6] * S[11] + S[1] * S[7] * S[10] + S[5] * S[2] * S[11] - S[5] * S[3] * S[10] - S[9] * S[2] * S[7] + S[9] * S[3] * S[6]; 15115ed3f7dSjeremylt 1522b730f8bSJeremy L Thompson S_inv[7] = S[0] * S[6] * S[11] - S[0] * S[7] * S[10] - S[4] * S[2] * S[11] + S[4] * S[3] * S[10] + S[8] * S[2] * S[7] - S[8] * S[3] * S[6]; 15315ed3f7dSjeremylt 1542b730f8bSJeremy L Thompson S_inv[11] = -S[0] * S[5] * S[11] + S[0] * S[7] * S[9] + S[4] * S[1] * S[11] - S[4] * S[3] * S[9] - S[8] * S[1] * S[7] + S[8] * S[3] * S[5]; 15515ed3f7dSjeremylt 1562b730f8bSJeremy L Thompson S_inv[15] = S[0] * S[5] * S[10] - S[0] * S[6] * S[9] - S[4] * S[1] * S[10] + S[4] * S[2] * S[9] + S[8] * S[1] * S[6] - S[8] * S[2] * S[5]; 15715ed3f7dSjeremylt 15815ed3f7dSjeremylt det = 1 / (S[0] * S_inv[0] + S[1] * S_inv[4] + S[2] * S_inv[8] + S[3] * S_inv[12]); 15915ed3f7dSjeremylt 1602b730f8bSJeremy L Thompson for (CeedInt i = 0; i < 16; i++) S_inv[i] *= det; 16115ed3f7dSjeremylt } 16215ed3f7dSjeremylt 16315ed3f7dSjeremylt // Set initial values 16415ed3f7dSjeremylt { 1654fee36f0SJeremy L Thompson CeedScalar nodes[p]; 1664fee36f0SJeremy L Thompson CeedScalar *u_array; 1674fee36f0SJeremy L Thompson 1684fee36f0SJeremy L Thompson CeedLobattoQuadrature(p, nodes, NULL); 1694fee36f0SJeremy L Thompson CeedVectorGetArray(u, CEED_MEM_HOST, &u_array); 1704fee36f0SJeremy L Thompson for (CeedInt i = 0; i < p; i++) { 1714fee36f0SJeremy L Thompson for (CeedInt j = 0; j < p; j++) u_array[i * p + j] = -(nodes[i] - 1.0) * (nodes[i] + 1.0) - (nodes[j] - 1.0) * (nodes[j] + 1.0); 1722b730f8bSJeremy L Thompson } 1734fee36f0SJeremy L Thompson CeedVectorRestoreArray(u, &u_array); 17415ed3f7dSjeremylt } 17515ed3f7dSjeremylt 17615ed3f7dSjeremylt // Apply original operator 1774fee36f0SJeremy L Thompson CeedOperatorApply(op_apply, u, v, CEED_REQUEST_IMMEDIATE); 17815ed3f7dSjeremylt 17915ed3f7dSjeremylt // Apply FDM element inverse 18015ed3f7dSjeremylt { 18115ed3f7dSjeremylt // -- Zero corners 1824fee36f0SJeremy L Thompson CeedScalar *v_array; 1834fee36f0SJeremy L Thompson 1844fee36f0SJeremy L Thompson CeedVectorGetArray(v, CEED_MEM_HOST, &v_array); 1854fee36f0SJeremy L Thompson v_array[0] = 0.0; 1864fee36f0SJeremy L Thompson v_array[p - 1] = 0.0; 1874fee36f0SJeremy L Thompson v_array[p * p - p] = 0.0; 1884fee36f0SJeremy L Thompson v_array[p * p - 1] = 0.0; 1894fee36f0SJeremy L Thompson CeedVectorRestoreArray(v, &v_array); 19015ed3f7dSjeremylt 19115ed3f7dSjeremylt // -- Apply FDM inverse to interior 1924fee36f0SJeremy L Thompson CeedOperatorApply(op_inverse, v, w, CEED_REQUEST_IMMEDIATE); 19315ed3f7dSjeremylt 19415ed3f7dSjeremylt // -- Pick off corners 1954fee36f0SJeremy L Thompson const CeedScalar *w_array; 19615ed3f7dSjeremylt CeedScalar w_Pi[4]; 1974fee36f0SJeremy L Thompson 1984fee36f0SJeremy L Thompson CeedVectorGetArrayRead(w, CEED_MEM_HOST, &w_array); 1994fee36f0SJeremy L Thompson w_Pi[0] = w_array[0]; 2004fee36f0SJeremy L Thompson w_Pi[1] = w_array[p - 1]; 2014fee36f0SJeremy L Thompson w_Pi[2] = w_array[p * p - p]; 2024fee36f0SJeremy L Thompson w_Pi[3] = w_array[p * p - 1]; 2034fee36f0SJeremy L Thompson CeedVectorRestoreArrayRead(w, &w_array); 20415ed3f7dSjeremylt 20515ed3f7dSjeremylt // -- Apply inverse of Schur complement 20615ed3f7dSjeremylt CeedScalar v_Pi[4]; 20715ed3f7dSjeremylt for (CeedInt i = 0; i < 4; i++) { 20815ed3f7dSjeremylt CeedScalar sum = 0.0; 20915ed3f7dSjeremylt for (CeedInt j = 0; j < 4; j++) { 21015ed3f7dSjeremylt sum += w_Pi[j] * S_inv[i * 4 + j]; 21115ed3f7dSjeremylt } 21285cf89eaSjeremylt v_Pi[i] = sum; 21315ed3f7dSjeremylt } 21415ed3f7dSjeremylt 21515ed3f7dSjeremylt // -- Set corners 2164fee36f0SJeremy L Thompson CeedVectorGetArray(v, CEED_MEM_HOST, &v_array); 2174fee36f0SJeremy L Thompson v_array[0] = v_Pi[0]; 2184fee36f0SJeremy L Thompson v_array[p - 1] = v_Pi[1]; 2194fee36f0SJeremy L Thompson v_array[p * p - p] = v_Pi[2]; 2204fee36f0SJeremy L Thompson v_array[p * p - 1] = v_Pi[3]; 2214fee36f0SJeremy L Thompson CeedVectorRestoreArray(v, &v_array); 22215ed3f7dSjeremylt 22315ed3f7dSjeremylt // -- Apply full FDM inverse again 2244fee36f0SJeremy L Thompson CeedOperatorApply(op_inverse, v, w, CEED_REQUEST_IMMEDIATE); 22515ed3f7dSjeremylt } 22615ed3f7dSjeremylt 22715ed3f7dSjeremylt // Check output 22815ed3f7dSjeremylt { 2294fee36f0SJeremy L Thompson const CeedScalar *u_array, *w_array; 2304fee36f0SJeremy L Thompson CeedVectorGetArrayRead(u, CEED_MEM_HOST, &u_array); 2314fee36f0SJeremy L Thompson CeedVectorGetArrayRead(w, CEED_MEM_HOST, &w_array); 2324fee36f0SJeremy L Thompson for (CeedInt i = 0; i < p; i++) { 2334fee36f0SJeremy L Thompson for (CeedInt j = 0; j < p; j++) { 2344fee36f0SJeremy L Thompson if (fabs(u_array[i * p + j] - w_array[i * p + j]) > 2e-3) { 23515ed3f7dSjeremylt // LCOV_EXCL_START 2364fee36f0SJeremy L Thompson printf("[%" CeedInt_FMT ", %" CeedInt_FMT "] Error in inverse: %e != %e\n", i, j, w_array[i * p + j], u_array[i * p + j]); 23715ed3f7dSjeremylt // LCOV_EXCL_STOP 2382b730f8bSJeremy L Thompson } 2392b730f8bSJeremy L Thompson } 2402b730f8bSJeremy L Thompson } 2414fee36f0SJeremy L Thompson CeedVectorRestoreArrayRead(u, &u_array); 2424fee36f0SJeremy L Thompson CeedVectorRestoreArrayRead(w, &w_array); 24315ed3f7dSjeremylt } 24415ed3f7dSjeremylt 24515ed3f7dSjeremylt // Cleanup 2464fee36f0SJeremy L Thompson CeedVectorDestroy(&x); 2474fee36f0SJeremy L Thompson CeedVectorDestroy(&q_data_diff); 2484fee36f0SJeremy L Thompson CeedVectorDestroy(&u); 2494fee36f0SJeremy L Thompson CeedVectorDestroy(&v); 2504fee36f0SJeremy L Thompson CeedVectorDestroy(&w); 2514fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restriction_u); 2524fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restriction_x); 2534fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restriction_q_data); 2544fee36f0SJeremy L Thompson CeedBasisDestroy(&basis_x); 2554fee36f0SJeremy L Thompson CeedBasisDestroy(&basis_u); 25615ed3f7dSjeremylt CeedQFunctionDestroy(&qf_setup_diff); 25715ed3f7dSjeremylt CeedQFunctionDestroy(&qf_apply); 25815ed3f7dSjeremylt CeedOperatorDestroy(&op_setup_diff); 25915ed3f7dSjeremylt CeedOperatorDestroy(&op_apply); 2604fee36f0SJeremy L Thompson CeedOperatorDestroy(&op_inverse); 26115ed3f7dSjeremylt CeedDestroy(&ceed); 26215ed3f7dSjeremylt return 0; 26315ed3f7dSjeremylt } 264