1437c7c90SJeremy L Thompson /// @file 2437c7c90SJeremy L Thompson /// Test assembly of operator diagonal for operator with multiple active bases 3437c7c90SJeremy L Thompson /// \test Test assembly of operator diagonal for operator with multiple active bases 4437c7c90SJeremy L Thompson #include "t539-operator.h" 5437c7c90SJeremy L Thompson 6437c7c90SJeremy L Thompson #include <ceed.h> 7437c7c90SJeremy L Thompson #include <math.h> 8437c7c90SJeremy L Thompson #include <stdlib.h> 9437c7c90SJeremy L Thompson 10437c7c90SJeremy L Thompson int main(int argc, char **argv) { 11437c7c90SJeremy L Thompson Ceed ceed; 12*4fee36f0SJeremy L Thompson CeedElemRestriction elem_restriction_x, elem_restriction_u_0, elem_restriction_u_1, elem_restr_qd_mass, elem_restr_qd_diff; 13437c7c90SJeremy L Thompson CeedBasis basis_x, basis_u_0, basis_u_1; 14437c7c90SJeremy L Thompson CeedQFunction qf_setup_mass, qf_setup_diff, qf_apply; 15437c7c90SJeremy L Thompson CeedOperator op_setup_mass, op_setup_diff, op_apply; 16*4fee36f0SJeremy L Thompson CeedVector q_data_mass, q_data_diff, x, assembled, u, v; 17*4fee36f0SJeremy L Thompson CeedInt num_elem = 6, p_0 = 2, p_1 = 3, q = 4, dim = 2, num_comp_0 = 2, num_comp_1 = 1; 18437c7c90SJeremy L Thompson CeedInt nx = 3, ny = 2; 19*4fee36f0SJeremy L Thompson CeedInt num_dofs_0 = (nx * (p_0 - 1) + 1) * (ny * (p_0 - 1) + 1), num_dofs_1 = (nx * (p_1 - 1) + 1) * (ny * (p_1 - 1) + 1); 20*4fee36f0SJeremy L Thompson CeedInt num_qpts = num_elem * q * q; 21*4fee36f0SJeremy L Thompson CeedInt ind_u_0[num_elem * p_0 * p_0], ind_u_1[num_elem * p_1 * p_1]; 22*4fee36f0SJeremy L Thompson CeedScalar assembled_true[num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1]; 23437c7c90SJeremy L Thompson 24437c7c90SJeremy L Thompson CeedInit(argv[1], &ceed); 25437c7c90SJeremy L Thompson 26*4fee36f0SJeremy L Thompson // Vectors 27*4fee36f0SJeremy L Thompson CeedVectorCreate(ceed, dim * num_dofs_0, &x); 28*4fee36f0SJeremy L Thompson { 29*4fee36f0SJeremy L Thompson CeedScalar x_array[dim * num_dofs_0]; 30*4fee36f0SJeremy L Thompson 31437c7c90SJeremy L Thompson for (CeedInt i = 0; i < nx * 2 + 1; i++) { 32437c7c90SJeremy L Thompson for (CeedInt j = 0; j < ny * 2 + 1; j++) { 33*4fee36f0SJeremy L Thompson x_array[i + j * (nx * 2 + 1) + 0 * num_dofs_0] = (CeedScalar)i / (2 * nx); 34*4fee36f0SJeremy L Thompson x_array[i + j * (nx * 2 + 1) + 1 * num_dofs_0] = (CeedScalar)j / (2 * ny); 35437c7c90SJeremy L Thompson } 36437c7c90SJeremy L Thompson } 37*4fee36f0SJeremy L Thompson CeedVectorSetArray(x, CEED_MEM_HOST, CEED_COPY_VALUES, x_array); 38*4fee36f0SJeremy L Thompson } 39*4fee36f0SJeremy L Thompson CeedVectorCreate(ceed, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, &u); 40*4fee36f0SJeremy L Thompson CeedVectorCreate(ceed, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, &v); 41437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_qpts, &q_data_mass); 42437c7c90SJeremy L Thompson CeedVectorCreate(ceed, num_qpts * dim * (dim + 1) / 2, &q_data_diff); 43437c7c90SJeremy L Thompson 44*4fee36f0SJeremy L Thompson // Restrictions 45437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_elem; i++) { 46437c7c90SJeremy L Thompson CeedInt col, row, offset; 47437c7c90SJeremy L Thompson col = i % nx; 48437c7c90SJeremy L Thompson row = i / nx; 49*4fee36f0SJeremy L Thompson offset = col * (p_0 - 1) + row * (nx * (p_0 - 1) + 1) * (p_0 - 1); 50*4fee36f0SJeremy L Thompson for (CeedInt j = 0; j < p_0; j++) { 51*4fee36f0SJeremy L Thompson for (CeedInt k = 0; k < p_0; k++) ind_u_0[p_0 * (p_0 * i + k) + j] = offset + k * (nx * (p_0 - 1) + 1) + j; 52437c7c90SJeremy L Thompson } 53*4fee36f0SJeremy L Thompson offset = col * (p_1 - 1) + row * (nx * (p_1 - 1) + 1) * (p_1 - 1) + num_dofs_0 * num_comp_0; 54*4fee36f0SJeremy L Thompson for (CeedInt j = 0; j < p_1; j++) { 55*4fee36f0SJeremy L Thompson for (CeedInt k = 0; k < p_1; k++) ind_u_1[p_1 * (p_1 * i + k) + j] = offset + k * (nx * (p_1 - 1) + 1) + j; 56437c7c90SJeremy L Thompson } 57437c7c90SJeremy L Thompson } 58*4fee36f0SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem, p_0 * p_0, dim, num_dofs_0, dim * num_dofs_0, CEED_MEM_HOST, CEED_USE_POINTER, ind_u_0, 59*4fee36f0SJeremy L Thompson &elem_restriction_x); 60*4fee36f0SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem, p_0 * p_0, num_comp_0, num_dofs_0, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, CEED_MEM_HOST, 61*4fee36f0SJeremy L Thompson CEED_USE_POINTER, ind_u_0, &elem_restriction_u_0); 62*4fee36f0SJeremy L Thompson CeedElemRestrictionCreate(ceed, num_elem, p_1 * p_1, num_comp_1, num_dofs_1, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, CEED_MEM_HOST, 63*4fee36f0SJeremy L Thompson CEED_USE_POINTER, ind_u_1, &elem_restriction_u_1); 64437c7c90SJeremy L Thompson 65*4fee36f0SJeremy L Thompson CeedInt strides_q_data_mass[3] = {1, q * q, q * q}; 66*4fee36f0SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, q * q, 1, num_qpts, strides_q_data_mass, &elem_restr_qd_mass); 67*4fee36f0SJeremy L Thompson 68*4fee36f0SJeremy L Thompson CeedInt strides_q_data_diff[3] = {1, q * q, dim * (dim + 1) / 2 * q * q}; 69*4fee36f0SJeremy L Thompson CeedElemRestrictionCreateStrided(ceed, num_elem, q * q, dim * (dim + 1) / 2, dim * (dim + 1) / 2 * num_qpts, strides_q_data_diff, 70*4fee36f0SJeremy L Thompson &elem_restr_qd_diff); 71437c7c90SJeremy L Thompson 72437c7c90SJeremy L Thompson // Bases 73*4fee36f0SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, p_0, q, CEED_GAUSS, &basis_x); 74*4fee36f0SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, num_comp_0, p_0, q, CEED_GAUSS, &basis_u_0); 75*4fee36f0SJeremy L Thompson CeedBasisCreateTensorH1Lagrange(ceed, dim, num_comp_1, p_1, q, CEED_GAUSS, &basis_u_1); 76437c7c90SJeremy L Thompson 77437c7c90SJeremy L Thompson // QFunction - setup mass 78437c7c90SJeremy L Thompson CeedQFunctionCreateInteriorByName(ceed, "Mass2DBuild", &qf_setup_mass); 79437c7c90SJeremy L Thompson 80437c7c90SJeremy L Thompson // Operator - setup mass 81437c7c90SJeremy L Thompson CeedOperatorCreate(ceed, qf_setup_mass, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_setup_mass); 82*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_setup_mass, "dx", elem_restriction_x, basis_x, CEED_VECTOR_ACTIVE); 83437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_mass, "weights", CEED_ELEMRESTRICTION_NONE, basis_x, CEED_VECTOR_NONE); 84437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_mass, "qdata", elem_restr_qd_mass, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE); 85437c7c90SJeremy L Thompson 86437c7c90SJeremy L Thompson // QFunction - setup diffusion 87437c7c90SJeremy L Thompson CeedQFunctionCreateInteriorByName(ceed, "Poisson2DBuild", &qf_setup_diff); 88437c7c90SJeremy L Thompson 89437c7c90SJeremy L Thompson // Operator - setup diffusion 90437c7c90SJeremy L Thompson CeedOperatorCreate(ceed, qf_setup_diff, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_setup_diff); 91*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "dx", elem_restriction_x, basis_x, CEED_VECTOR_ACTIVE); 92437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "weights", CEED_ELEMRESTRICTION_NONE, basis_x, CEED_VECTOR_NONE); 93437c7c90SJeremy L Thompson CeedOperatorSetField(op_setup_diff, "qdata", elem_restr_qd_diff, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE); 94437c7c90SJeremy L Thompson 95437c7c90SJeremy L Thompson // Apply Setup Operators 96*4fee36f0SJeremy L Thompson CeedOperatorApply(op_setup_mass, x, q_data_mass, CEED_REQUEST_IMMEDIATE); 97*4fee36f0SJeremy L Thompson CeedOperatorApply(op_setup_diff, x, q_data_diff, CEED_REQUEST_IMMEDIATE); 98437c7c90SJeremy L Thompson 99437c7c90SJeremy L Thompson // QFunction - apply 100437c7c90SJeremy L Thompson CeedQFunctionCreateInterior(ceed, 1, apply, apply_loc, &qf_apply); 101437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "du_0", num_comp_0 * dim, CEED_EVAL_GRAD); 102437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "mass qdata", 1, CEED_EVAL_NONE); 103437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "diff qdata", dim * (dim + 1) / 2, CEED_EVAL_NONE); 104437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "u_0", num_comp_0, CEED_EVAL_INTERP); 105437c7c90SJeremy L Thompson CeedQFunctionAddInput(qf_apply, "u_1", num_comp_1, CEED_EVAL_INTERP); 106437c7c90SJeremy L Thompson CeedQFunctionAddOutput(qf_apply, "v_0", num_comp_0, CEED_EVAL_INTERP); 107437c7c90SJeremy L Thompson CeedQFunctionAddOutput(qf_apply, "v_1", num_comp_1, CEED_EVAL_INTERP); 108437c7c90SJeremy L Thompson CeedQFunctionAddOutput(qf_apply, "dv_0", num_comp_0 * dim, CEED_EVAL_GRAD); 109437c7c90SJeremy L Thompson 110437c7c90SJeremy L Thompson // Operator - apply 111437c7c90SJeremy L Thompson CeedOperatorCreate(ceed, qf_apply, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, &op_apply); 112*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "du_0", elem_restriction_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 113437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "mass qdata", elem_restr_qd_mass, CEED_BASIS_COLLOCATED, q_data_mass); 114437c7c90SJeremy L Thompson CeedOperatorSetField(op_apply, "diff qdata", elem_restr_qd_diff, CEED_BASIS_COLLOCATED, q_data_diff); 115*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "u_0", elem_restriction_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 116*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "u_1", elem_restriction_u_1, basis_u_1, CEED_VECTOR_ACTIVE); 117*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "v_0", elem_restriction_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 118*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "v_1", elem_restriction_u_1, basis_u_1, CEED_VECTOR_ACTIVE); 119*4fee36f0SJeremy L Thompson CeedOperatorSetField(op_apply, "dv_0", elem_restriction_u_0, basis_u_0, CEED_VECTOR_ACTIVE); 120437c7c90SJeremy L Thompson 121437c7c90SJeremy L Thompson // Assemble diagonal 122*4fee36f0SJeremy L Thompson CeedVectorCreate(ceed, num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1, &assembled); 123*4fee36f0SJeremy L Thompson CeedOperatorLinearAssembleDiagonal(op_apply, assembled, CEED_REQUEST_IMMEDIATE); 124437c7c90SJeremy L Thompson 125437c7c90SJeremy L Thompson // Manually assemble diagonal 126*4fee36f0SJeremy L Thompson CeedVectorSetValue(u, 0.0); 127437c7c90SJeremy L Thompson for (int i = 0; i < num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1; i++) assembled_true[i] = 0.0; 128437c7c90SJeremy L Thompson for (int i = 0; i < num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1; i++) { 129437c7c90SJeremy L Thompson // Set input 130*4fee36f0SJeremy L Thompson CeedScalar *u_array; 131*4fee36f0SJeremy L Thompson const CeedScalar *v_array; 132*4fee36f0SJeremy L Thompson 133*4fee36f0SJeremy L Thompson CeedVectorGetArray(u, CEED_MEM_HOST, &u_array); 134*4fee36f0SJeremy L Thompson u_array[i] = 1.0; 135*4fee36f0SJeremy L Thompson if (i) u_array[i - 1] = 0.0; 136*4fee36f0SJeremy L Thompson CeedVectorRestoreArray(u, &u_array); 137437c7c90SJeremy L Thompson 138437c7c90SJeremy L Thompson // Compute diag entry for DoF i 139*4fee36f0SJeremy L Thompson CeedOperatorApply(op_apply, u, v, CEED_REQUEST_IMMEDIATE); 140437c7c90SJeremy L Thompson 141437c7c90SJeremy L Thompson // Retrieve entry 142*4fee36f0SJeremy L Thompson CeedVectorGetArrayRead(v, CEED_MEM_HOST, &v_array); 143*4fee36f0SJeremy L Thompson assembled_true[i] = v_array[i]; 144*4fee36f0SJeremy L Thompson CeedVectorRestoreArrayRead(v, &v_array); 145437c7c90SJeremy L Thompson } 146437c7c90SJeremy L Thompson 147437c7c90SJeremy L Thompson // Check output 148*4fee36f0SJeremy L Thompson { 149*4fee36f0SJeremy L Thompson const CeedScalar *assembled_array; 150*4fee36f0SJeremy L Thompson 151*4fee36f0SJeremy L Thompson CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array); 152437c7c90SJeremy L Thompson for (int i = 0; i < num_comp_0 * num_dofs_0 + num_comp_1 * num_dofs_1; i++) { 153*4fee36f0SJeremy L Thompson if (fabs(assembled_array[i] - assembled_true[i]) > 1000. * CEED_EPSILON) { 154*4fee36f0SJeremy L Thompson // LCOV_EXCL_START 155*4fee36f0SJeremy L Thompson printf("[%" CeedInt_FMT "] Error in assembly: %f != %f\n", i, assembled_array[i], assembled_true[i]); 156*4fee36f0SJeremy L Thompson // LCOV_EXCL_STOP 157437c7c90SJeremy L Thompson } 158*4fee36f0SJeremy L Thompson } 159*4fee36f0SJeremy L Thompson CeedVectorRestoreArrayRead(assembled, &assembled_array); 160*4fee36f0SJeremy L Thompson } 161437c7c90SJeremy L Thompson 162437c7c90SJeremy L Thompson // Cleanup 163*4fee36f0SJeremy L Thompson CeedVectorDestroy(&x); 164*4fee36f0SJeremy L Thompson CeedVectorDestroy(&assembled); 165*4fee36f0SJeremy L Thompson CeedVectorDestroy(&u); 166*4fee36f0SJeremy L Thompson CeedVectorDestroy(&v); 167*4fee36f0SJeremy L Thompson CeedVectorDestroy(&q_data_mass); 168*4fee36f0SJeremy L Thompson CeedVectorDestroy(&q_data_diff); 169*4fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restriction_x); 170*4fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restriction_u_0); 171*4fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restriction_u_1); 172*4fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_mass); 173*4fee36f0SJeremy L Thompson CeedElemRestrictionDestroy(&elem_restr_qd_diff); 174*4fee36f0SJeremy L Thompson CeedBasisDestroy(&basis_x); 175*4fee36f0SJeremy L Thompson CeedBasisDestroy(&basis_u_0); 176*4fee36f0SJeremy L Thompson CeedBasisDestroy(&basis_u_1); 177437c7c90SJeremy L Thompson CeedQFunctionDestroy(&qf_setup_mass); 178437c7c90SJeremy L Thompson CeedQFunctionDestroy(&qf_setup_diff); 179437c7c90SJeremy L Thompson CeedQFunctionDestroy(&qf_apply); 180437c7c90SJeremy L Thompson CeedOperatorDestroy(&op_setup_mass); 181437c7c90SJeremy L Thompson CeedOperatorDestroy(&op_setup_diff); 182437c7c90SJeremy L Thompson CeedOperatorDestroy(&op_apply); 183437c7c90SJeremy L Thompson CeedDestroy(&ceed); 184437c7c90SJeremy L Thompson return 0; 185437c7c90SJeremy L Thompson } 186