1 /// @file 2 /// Test FLOP estimation for composite mass matrix operator 3 /// \test Test FLOP estimation for composite mass matrix operator 4 #include <ceed.h> 5 #include <math.h> 6 #include <stdlib.h> 7 8 #include "t320-basis.h" 9 10 /* The mesh comprises of two rows of 3 quadralaterals followed by one row 11 of 6 triangles: 12 _ _ _ 13 |_|_|_| 14 |_|_|_| 15 |/|/|/| 16 17 */ 18 19 int main(int argc, char **argv) { 20 Ceed ceed; 21 CeedSize flop_estimate; 22 CeedElemRestriction elem_restr_x_tet, elem_restr_u_tet, elem_restr_qd_i_tet, elem_restr_x_hex, elem_restr_u_hex, elem_restr_qd_i_hex; 23 CeedBasis basis_x_tet, basis_u_tet, basis_x_hex, basis_u_hex; 24 CeedQFunction qf_mass; 25 CeedOperator op_mass_tet, op_mass_hex, op_mass; 26 CeedVector q_data_tet, q_data_hex; 27 CeedInt num_elem_tet = 6, P_tet = 6, Q_tet = 4, num_elem_hex = 6, P_hex = 3, Q_hex = 4, dim = 2; 28 CeedInt n_x = 3, n_y = 3, n_x_tet = 3, n_y_tet = 1, n_x_hex = 3; 29 CeedInt row, col, offset; 30 CeedInt num_dofs = (n_x * 2 + 1) * (n_y * 2 + 1), num_qpts_tet = num_elem_tet * Q_tet, num_qpts_hex = num_elem_hex * Q_hex * Q_hex; 31 CeedInt ind_x_tet[num_elem_tet * P_tet], ind_x_hex[num_elem_hex * P_hex * P_hex]; 32 CeedScalar q_ref[dim * Q_tet], q_weight[Q_tet]; 33 CeedScalar interp[P_tet * Q_tet], grad[dim * P_tet * Q_tet]; 34 35 CeedInit(argv[1], &ceed); 36 37 // Qdata Vectors 38 CeedVectorCreate(ceed, num_qpts_tet, &q_data_tet); 39 CeedVectorCreate(ceed, num_qpts_hex, &q_data_hex); 40 41 // Set up Tet Elements 42 for (CeedInt i = 0; i < num_elem_tet / 2; i++) { 43 col = i % n_x_tet; 44 row = i / n_x_tet; 45 offset = col * 2 + row * (n_x_tet * 2 + 1) * 2; 46 47 ind_x_tet[i * 2 * P_tet + 0] = 2 + offset; 48 ind_x_tet[i * 2 * P_tet + 1] = 9 + offset; 49 ind_x_tet[i * 2 * P_tet + 2] = 16 + offset; 50 ind_x_tet[i * 2 * P_tet + 3] = 1 + offset; 51 ind_x_tet[i * 2 * P_tet + 4] = 8 + offset; 52 ind_x_tet[i * 2 * P_tet + 5] = 0 + offset; 53 54 ind_x_tet[i * 2 * P_tet + 6] = 14 + offset; 55 ind_x_tet[i * 2 * P_tet + 7] = 7 + offset; 56 ind_x_tet[i * 2 * P_tet + 8] = 0 + offset; 57 ind_x_tet[i * 2 * P_tet + 9] = 15 + offset; 58 ind_x_tet[i * 2 * P_tet + 10] = 8 + offset; 59 ind_x_tet[i * 2 * P_tet + 11] = 16 + offset; 60 } 61 62 // -- Restrictions 63 CeedElemRestrictionCreate(ceed, num_elem_tet, P_tet, dim, num_dofs, dim * num_dofs, CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet, &elem_restr_x_tet); 64 65 CeedElemRestrictionCreate(ceed, num_elem_tet, P_tet, 1, 1, num_dofs, CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet, &elem_restr_u_tet); 66 CeedInt strides_qd_tet[3] = {1, Q_tet, Q_tet}; 67 CeedElemRestrictionCreateStrided(ceed, num_elem_tet, Q_tet, 1, num_qpts_tet, strides_qd_tet, &elem_restr_qd_i_tet); 68 69 // -- Bases 70 buildmats(q_ref, q_weight, interp, grad); 71 CeedBasisCreateH1(ceed, CEED_TOPOLOGY_TRIANGLE, dim, P_tet, Q_tet, interp, grad, q_ref, q_weight, &basis_x_tet); 72 73 buildmats(q_ref, q_weight, interp, grad); 74 CeedBasisCreateH1(ceed, CEED_TOPOLOGY_TRIANGLE, 1, P_tet, Q_tet, interp, grad, q_ref, q_weight, &basis_u_tet); 75 76 // -- QFunction 77 CeedQFunctionCreateInteriorByName(ceed, "MassApply", &qf_mass); 78 79 // -- Operators 80 // ---- Mass Tet 81 CeedOperatorCreate(ceed, qf_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_mass_tet); 82 CeedOperatorSetField(op_mass_tet, "u", elem_restr_u_tet, basis_u_tet, CEED_VECTOR_ACTIVE); 83 CeedOperatorSetField(op_mass_tet, "qdata", elem_restr_qd_i_tet, CEED_BASIS_COLLOCATED, q_data_tet); 84 CeedOperatorSetField(op_mass_tet, "v", elem_restr_u_tet, basis_u_tet, CEED_VECTOR_ACTIVE); 85 86 // Set up Hex Elements 87 for (CeedInt i = 0; i < num_elem_hex; i++) { 88 col = i % n_x_hex; 89 row = i / n_x_hex; 90 offset = (n_x_tet * 2 + 1) * (n_y_tet * 2) * (1 + row) + col * 2; 91 for (CeedInt j = 0; j < P_hex; j++) { 92 for (CeedInt k = 0; k < P_hex; k++) ind_x_hex[P_hex * (P_hex * i + k) + j] = offset + k * (n_x_hex * 2 + 1) + j; 93 } 94 } 95 96 // -- Restrictions 97 CeedElemRestrictionCreate(ceed, num_elem_hex, P_hex * P_hex, dim, num_dofs, dim * num_dofs, CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex, 98 &elem_restr_x_hex); 99 100 CeedElemRestrictionCreate(ceed, num_elem_hex, P_hex * P_hex, 1, 1, num_dofs, CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex, &elem_restr_u_hex); 101 CeedInt strides_qd_hex[3] = {1, Q_hex * Q_hex, Q_hex * Q_hex}; 102 CeedElemRestrictionCreateStrided(ceed, num_elem_hex, Q_hex * Q_hex, 1, num_qpts_hex, strides_qd_hex, &elem_restr_qd_i_hex); 103 104 // -- Bases 105 CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, P_hex, Q_hex, CEED_GAUSS, &basis_x_hex); 106 CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, P_hex, Q_hex, CEED_GAUSS, &basis_u_hex); 107 108 // -- Operators 109 CeedOperatorCreate(ceed, qf_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_mass_hex); 110 CeedOperatorSetField(op_mass_hex, "u", elem_restr_u_hex, basis_u_hex, CEED_VECTOR_ACTIVE); 111 CeedOperatorSetField(op_mass_hex, "qdata", elem_restr_qd_i_hex, CEED_BASIS_COLLOCATED, q_data_hex); 112 CeedOperatorSetField(op_mass_hex, "v", elem_restr_u_hex, basis_u_hex, CEED_VECTOR_ACTIVE); 113 114 // Set up Composite Operator 115 // -- Create 116 CeedCompositeOperatorCreate(ceed, &op_mass); 117 // -- Add SubOperators 118 CeedCompositeOperatorAddSub(op_mass, op_mass_tet); 119 CeedCompositeOperatorAddSub(op_mass, op_mass_hex); 120 121 // Estimate FLOPs 122 CeedQFunctionSetUserFlopsEstimate(qf_mass, 1); 123 CeedOperatorGetFlopsEstimate(op_mass, &flop_estimate); 124 125 // Check output 126 if (flop_estimate != 3042) printf("Incorrect FLOP estimate computed, %ld != 3042\n", flop_estimate); 127 128 // Cleanup 129 CeedQFunctionDestroy(&qf_mass); 130 CeedOperatorDestroy(&op_mass_tet); 131 CeedOperatorDestroy(&op_mass_hex); 132 CeedOperatorDestroy(&op_mass); 133 CeedElemRestrictionDestroy(&elem_restr_u_tet); 134 CeedElemRestrictionDestroy(&elem_restr_x_tet); 135 CeedElemRestrictionDestroy(&elem_restr_qd_i_tet); 136 CeedElemRestrictionDestroy(&elem_restr_u_hex); 137 CeedElemRestrictionDestroy(&elem_restr_x_hex); 138 CeedElemRestrictionDestroy(&elem_restr_qd_i_hex); 139 CeedBasisDestroy(&basis_u_tet); 140 CeedBasisDestroy(&basis_x_tet); 141 CeedBasisDestroy(&basis_u_hex); 142 CeedBasisDestroy(&basis_x_hex); 143 CeedVectorDestroy(&q_data_tet); 144 CeedVectorDestroy(&q_data_hex); 145 CeedDestroy(&ceed); 146 return 0; 147 } 148