16e15d496SJeremy L Thompson /// @file 26e15d496SJeremy L Thompson /// Test FLOP estimation for composite mass matrix operator 36e15d496SJeremy L Thompson /// \test Test FLOP estimation for composite mass matrix operator 46e15d496SJeremy L Thompson #include <ceed.h> 56e15d496SJeremy L Thompson #include <stdlib.h> 66e15d496SJeremy L Thompson #include <math.h> 76e15d496SJeremy L Thompson #include "t320-basis.h" 86e15d496SJeremy L Thompson 96e15d496SJeremy L Thompson /* The mesh comprises of two rows of 3 quadralaterals followed by one row 106e15d496SJeremy L Thompson of 6 triangles: 116e15d496SJeremy L Thompson _ _ _ 126e15d496SJeremy L Thompson |_|_|_| 136e15d496SJeremy L Thompson |_|_|_| 146e15d496SJeremy L Thompson |/|/|/| 156e15d496SJeremy L Thompson 166e15d496SJeremy L Thompson */ 176e15d496SJeremy L Thompson 186e15d496SJeremy L Thompson int main(int argc, char **argv) { 196e15d496SJeremy L Thompson Ceed ceed; 20*9d36ca50SJeremy L Thompson CeedSize flop_estimate; 216e15d496SJeremy L Thompson CeedElemRestriction elem_restr_x_tet, elem_restr_u_tet, 226e15d496SJeremy L Thompson elem_restr_qd_i_tet, 236e15d496SJeremy L Thompson elem_restr_x_hex, elem_restr_u_hex, 246e15d496SJeremy L Thompson elem_restr_qd_i_hex; 256e15d496SJeremy L Thompson CeedBasis basis_x_tet, basis_u_tet, 266e15d496SJeremy L Thompson basis_x_hex, basis_u_hex; 276e15d496SJeremy L Thompson CeedQFunction qf_mass; 286e15d496SJeremy L Thompson CeedOperator op_mass_tet, op_mass_hex, op_mass; 296e15d496SJeremy L Thompson CeedVector q_data_tet, q_data_hex; 306e15d496SJeremy L Thompson CeedInt num_elem_tet = 6, P_tet = 6, Q_tet = 4, 316e15d496SJeremy L Thompson num_elem_hex = 6, P_hex = 3, Q_hex = 4, dim = 2; 326e15d496SJeremy L Thompson CeedInt n_x = 3, n_y = 3, 336e15d496SJeremy L Thompson n_x_tet = 3, n_y_tet = 1, n_x_hex = 3; 346e15d496SJeremy L Thompson CeedInt row, col, offset; 356e15d496SJeremy L Thompson CeedInt num_dofs = (n_x*2+1)*(n_y*2+1), 366e15d496SJeremy L Thompson num_qpts_tet = num_elem_tet*Q_tet, 376e15d496SJeremy L Thompson num_qpts_hex = num_elem_hex*Q_hex*Q_hex; 386e15d496SJeremy L Thompson CeedInt ind_x_tet[num_elem_tet*P_tet], 396e15d496SJeremy L Thompson ind_x_hex[num_elem_hex*P_hex*P_hex]; 406e15d496SJeremy L Thompson CeedScalar q_ref[dim*Q_tet], q_weight[Q_tet]; 416e15d496SJeremy L Thompson CeedScalar interp[P_tet*Q_tet], grad[dim*P_tet*Q_tet]; 426e15d496SJeremy L Thompson 436e15d496SJeremy L Thompson CeedInit(argv[1], &ceed); 446e15d496SJeremy L Thompson 456e15d496SJeremy L Thompson // Qdata Vectors 466e15d496SJeremy L Thompson CeedVectorCreate(ceed, num_qpts_tet, &q_data_tet); 476e15d496SJeremy L Thompson CeedVectorCreate(ceed, num_qpts_hex, &q_data_hex); 486e15d496SJeremy L Thompson 496e15d496SJeremy L Thompson // Set up Tet Elements 506e15d496SJeremy L Thompson for (CeedInt i=0; i<num_elem_tet/2; i++) { 516e15d496SJeremy L Thompson col = i % n_x_tet; 526e15d496SJeremy L Thompson row = i / n_x_tet; 536e15d496SJeremy L Thompson offset = col*2 + row*(n_x_tet*2+1)*2; 546e15d496SJeremy L Thompson 556e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 0] = 2 + offset; 566e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 1] = 9 + offset; 576e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 2] = 16 + offset; 586e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 3] = 1 + offset; 596e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 4] = 8 + offset; 606e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 5] = 0 + offset; 616e15d496SJeremy L Thompson 626e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 6] = 14 + offset; 636e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 7] = 7 + offset; 646e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 8] = 0 + offset; 656e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 9] = 15 + offset; 666e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 10] = 8 + offset; 676e15d496SJeremy L Thompson ind_x_tet[i*2*P_tet + 11] = 16 + offset; 686e15d496SJeremy L Thompson } 696e15d496SJeremy L Thompson 706e15d496SJeremy L Thompson // -- Restrictions 716e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_tet, P_tet, dim, num_dofs, 726e15d496SJeremy L Thompson dim*num_dofs, 736e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet, 746e15d496SJeremy L Thompson &elem_restr_x_tet); 756e15d496SJeremy L Thompson 766e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_tet, P_tet, 1, 1, num_dofs, 776e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet, 786e15d496SJeremy L Thompson &elem_restr_u_tet); 796e15d496SJeremy L Thompson CeedInt strides_qd_tet[3] = {1, Q_tet, Q_tet}; 806e15d496SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem_tet, Q_tet, 1, num_qpts_tet, 816e15d496SJeremy L Thompson strides_qd_tet, &elem_restr_qd_i_tet); 826e15d496SJeremy L Thompson 836e15d496SJeremy L Thompson // -- Bases 846e15d496SJeremy L Thompson buildmats(q_ref, q_weight, interp, grad); 856e15d496SJeremy L Thompson CeedBasisCreateH1(ceed, CEED_TOPOLOGY_TRIANGLE, dim, P_tet, Q_tet, interp, grad, 866e15d496SJeremy L Thompson q_ref, q_weight, &basis_x_tet); 876e15d496SJeremy L Thompson 886e15d496SJeremy L Thompson buildmats(q_ref, q_weight, interp, grad); 896e15d496SJeremy L Thompson CeedBasisCreateH1(ceed, CEED_TOPOLOGY_TRIANGLE, 1, P_tet, Q_tet, interp, grad, 906e15d496SJeremy L Thompson q_ref, q_weight, &basis_u_tet); 916e15d496SJeremy L Thompson 926e15d496SJeremy L Thompson // -- QFunction 936e15d496SJeremy L Thompson CeedQFunctionCreateInteriorByName(ceed, "MassApply", &qf_mass); 946e15d496SJeremy L Thompson 956e15d496SJeremy L Thompson // -- Operators 966e15d496SJeremy L Thompson // ---- Mass Tet 976e15d496SJeremy L Thompson CeedOperatorCreate(ceed, qf_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, 986e15d496SJeremy L Thompson &op_mass_tet); 996e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_tet, "u", elem_restr_u_tet, basis_u_tet, 1006e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 1016e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_tet, "qdata", elem_restr_qd_i_tet, 1026e15d496SJeremy L Thompson CEED_BASIS_COLLOCATED, 1036e15d496SJeremy L Thompson q_data_tet); 1046e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_tet, "v", elem_restr_u_tet, basis_u_tet, 1056e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 1066e15d496SJeremy L Thompson 1076e15d496SJeremy L Thompson // Set up Hex Elements 1086e15d496SJeremy L Thompson for (CeedInt i=0; i<num_elem_hex; i++) { 1096e15d496SJeremy L Thompson col = i % n_x_hex; 1106e15d496SJeremy L Thompson row = i / n_x_hex; 1116e15d496SJeremy L Thompson offset = (n_x_tet*2+1)*(n_y_tet*2)*(1+row) + col*2; 1126e15d496SJeremy L Thompson for (CeedInt j=0; j<P_hex; j++) 1136e15d496SJeremy L Thompson for (CeedInt k=0; k<P_hex; k++) 1146e15d496SJeremy L Thompson ind_x_hex[P_hex*(P_hex*i+k)+j] = offset + k*(n_x_hex*2+1) + j; 1156e15d496SJeremy L Thompson } 1166e15d496SJeremy L Thompson 1176e15d496SJeremy L Thompson // -- Restrictions 1186e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_hex, P_hex*P_hex, dim, num_dofs, 1196e15d496SJeremy L Thompson dim*num_dofs, 1206e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex, 1216e15d496SJeremy L Thompson &elem_restr_x_hex); 1226e15d496SJeremy L Thompson 1236e15d496SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem_hex, P_hex*P_hex, 1, 1, num_dofs, 1246e15d496SJeremy L Thompson CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex, 1256e15d496SJeremy L Thompson &elem_restr_u_hex); 1266e15d496SJeremy L Thompson CeedInt strides_qd_hex[3] = {1, Q_hex*Q_hex, Q_hex*Q_hex}; 1276e15d496SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem_hex, Q_hex*Q_hex, 1, 1286e15d496SJeremy L Thompson num_qpts_hex, 1296e15d496SJeremy L Thompson strides_qd_hex, &elem_restr_qd_i_hex); 1306e15d496SJeremy L Thompson 1316e15d496SJeremy L Thompson // -- Bases 1326e15d496SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, P_hex, Q_hex, CEED_GAUSS, 1336e15d496SJeremy L Thompson &basis_x_hex); 1346e15d496SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, P_hex, Q_hex, CEED_GAUSS, 1356e15d496SJeremy L Thompson &basis_u_hex); 1366e15d496SJeremy L Thompson 1376e15d496SJeremy L Thompson // -- Operators 1386e15d496SJeremy L Thompson CeedOperatorCreate(ceed, qf_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, 1396e15d496SJeremy L Thompson &op_mass_hex); 1406e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_hex, "u", elem_restr_u_hex, basis_u_hex, 1416e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 1426e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_hex, "qdata", elem_restr_qd_i_hex, 1436e15d496SJeremy L Thompson CEED_BASIS_COLLOCATED, 1446e15d496SJeremy L Thompson q_data_hex); 1456e15d496SJeremy L Thompson CeedOperatorSetField(op_mass_hex, "v", elem_restr_u_hex, basis_u_hex, 1466e15d496SJeremy L Thompson CEED_VECTOR_ACTIVE); 1476e15d496SJeremy L Thompson 1486e15d496SJeremy L Thompson // Set up Composite Operator 1496e15d496SJeremy L Thompson // -- Create 1506e15d496SJeremy L Thompson CeedCompositeOperatorCreate(ceed, &op_mass); 1516e15d496SJeremy L Thompson // -- Add SubOperators 1526e15d496SJeremy L Thompson CeedCompositeOperatorAddSub(op_mass, op_mass_tet); 1536e15d496SJeremy L Thompson CeedCompositeOperatorAddSub(op_mass, op_mass_hex); 1546e15d496SJeremy L Thompson 1556e15d496SJeremy L Thompson // Estimate FLOPs 1566e15d496SJeremy L Thompson CeedQFunctionSetUserFlopsEstimate(qf_mass, 1); 1576e15d496SJeremy L Thompson CeedOperatorGetFlopsEstimate(op_mass, &flop_estimate); 1586e15d496SJeremy L Thompson 1596e15d496SJeremy L Thompson // Check output 1606e15d496SJeremy L Thompson if (flop_estimate != 3042) 1616e15d496SJeremy L Thompson // LCOV_EXCL_START 162*9d36ca50SJeremy L Thompson printf("Incorrect FLOP estimate computed, %ld != 3042\n", flop_estimate); 1636e15d496SJeremy L Thompson // LOCV_EXCL_STOP 1646e15d496SJeremy L Thompson 1656e15d496SJeremy L Thompson // Cleanup 1666e15d496SJeremy L Thompson CeedQFunctionDestroy(&qf_mass); 1676e15d496SJeremy L Thompson CeedOperatorDestroy(&op_mass_tet); 1686e15d496SJeremy L Thompson CeedOperatorDestroy(&op_mass_hex); 1696e15d496SJeremy L Thompson CeedOperatorDestroy(&op_mass); 1706e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_u_tet); 1716e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_x_tet); 1726e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_i_tet); 1736e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_u_hex); 1746e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_x_hex); 1756e15d496SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_i_hex); 1766e15d496SJeremy L Thompson CeedBasisDestroy(&basis_u_tet); 1776e15d496SJeremy L Thompson CeedBasisDestroy(&basis_x_tet); 1786e15d496SJeremy L Thompson CeedBasisDestroy(&basis_u_hex); 1796e15d496SJeremy L Thompson CeedBasisDestroy(&basis_x_hex); 1806e15d496SJeremy L Thompson CeedVectorDestroy(&q_data_tet); 1816e15d496SJeremy L Thompson CeedVectorDestroy(&q_data_hex); 1826e15d496SJeremy L Thompson CeedDestroy(&ceed); 1836e15d496SJeremy L Thompson return 0; 1846e15d496SJeremy L Thompson } 185