| /libCEED/examples/deal.II/ |
| H A D | bps-qfunctions.h | 45 CeedPragmaSIMD for (CeedInt i = 0; i < Q; ++i) in f_build_mass() local 47 qdata[i] = J[i] * w[i]; in f_build_mass() 51 CeedPragmaSIMD for (CeedInt i = 0; i < Q; ++i) in f_build_mass() local 53 qdata[i] = (J[i + Q * 0] * J[i + Q * 3] - J[i + Q * 1] * J[i + Q * 2]) * w[i]; in f_build_mass() 57 CeedPragmaSIMD for (CeedInt i = 0; i < Q; ++i) in f_build_mass() local 59 qdata[i] = (J[i + Q * 0] * (J[i + Q * 4] * J[i + Q * 8] - J[i + Q * 5] * J[i + Q * 7]) - in f_build_mass() 60 J[i + Q * 1] * (J[i + Q * 3] * J[i + Q * 8] - J[i + Q * 5] * J[i + Q * 6]) + in f_build_mass() 61 J[i + Q * 2] * (J[i + Q * 3] * J[i + Q * 7] - J[i + Q * 4] * J[i + Q * 6])) * in f_build_mass() 62 w[i]; in f_build_mass() 83 CeedPragmaSIMD for (CeedInt i = 0; i < Q; ++i) in f_apply_mass() local [all …]
|
| /libCEED/backends/sycl-gen/ |
| H A D | ceed-sycl-gen-operator-build.sycl.cpp | 137 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local 138 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen() 143 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen() 162 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local 163 CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen() 168 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen() 193 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local 194 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen() 196 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen() 203 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local [all …]
|
| /libCEED/tests/ |
| H A D | t218-elemrestriction.c | 19 for (CeedInt i = 0; i < 3 * num_elem + 1; i++) x_array[i] = 10 + i; in main() local 24 for (CeedInt i = 0; i < num_elem; i++) { in main() local 25 ind[4 * i + 0] = 3 * i + 0; in main() 26 ind[4 * i + 1] = 3 * i + 1; in main() 27 ind[4 * i + 2] = 3 * i + 2; in main() 28 ind[4 * i + 3] = 3 * i + 3; in main() 29 if (i % 2 > 0) { in main() 34 curl_orients[3 * 4 * i + 0] = 0; in main() 35 curl_orients[3 * 4 * i + 1] = 1; in main() 36 curl_orients[3 * 4 * i + 2] = 0; in main() [all …]
|
| H A D | t122-vector.c | 27 for (CeedInt i = 0; i < len; i++) array[i] = i; in main() local 35 for (CeedInt i = 0; i < len; i++) { in main() local 36 if (fabs(read_array[i] - i * i) > 1e-14) { in main() 38 …n w = x .* y at index %" CeedInt_FMT ", computed: %f actual: %f\n", i, read_array[i], 1.0 * i * i); in main() 47 for (CeedInt i = 0; i < len; i++) { in main() local 48 if (fabs(read_array[i] - i * i * i) > 1e-14) { in main() 50 …= w .* y at index %" CeedInt_FMT ", computed: %f actual: %f\n", i, read_array[i], 1.0 * i * i * i); in main() 59 for (CeedInt i = 0; i < len; i++) { in main() local 60 if (fabs(read_array[i] - i * i * i * i) > 1e-14) { in main() 62 ….* w at index %" CeedInt_FMT ", computed: %f actual: %f\n", i, read_array[i], 1.0 * i * i * i * i); in main() [all …]
|
| H A D | t532-operator.h | 13 for (CeedInt i = 0; i < Q; i++) { in setup_mass() local 14 rho[i] = weight[i] * (J[i + Q * 0] * J[i + Q * 3] - J[i + Q * 1] * J[i + Q * 2]); in setup_mass() 31 for (CeedInt i = 0; i < Q; i++) { in setup_diff() local 34 const CeedScalar J11 = J[i + Q * 0]; in setup_diff() 35 const CeedScalar J21 = J[i + Q * 1]; in setup_diff() 36 const CeedScalar J12 = J[i + Q * 2]; in setup_diff() 37 const CeedScalar J22 = J[i + Q * 3]; in setup_diff() 38 const CeedScalar w = qw[i] / (J11 * J22 - J21 * J12); in setup_diff() 39 qd[i + Q * 0] = w * (J12 * J12 + J22 * J22); in setup_diff() 40 qd[i + Q * 1] = w * (J11 * J11 + J21 * J21); in setup_diff() [all …]
|
| H A D | t532-operator-f.h | 11 do i=1,q 12 v1(i)=u2(i)*(u1(i+q*0)*u1(i+q*3)-u1(i+q*1)*u1(i+q*2)) 28 do i=1,q 29 w=u2(i)/(u1(i+q*0)*u1(i+q*3)-u1(i+q*1)*u1(i+q*2)) 30 v1(i+q*0)=w*(u1(i+q*2)*u1(i+q*2)+u1(i+q*3)*u1(i+q*3)) 31 v1(i+q*1)=w*(u1(i+q*0)*u1(i+q*0)+u1(i+q*1)*u1(i+q*1)) 32 v1(i+q*2)=-w*(u1(i+q*0)*u1(i+q*2)+u1(i+q*2)*u1(i+q*3)) 50 do i=1,q 52 v1(i) = u2(i)*u4(i) 54 du0=u1(i+q*0) [all …]
|
| H A D | t219-elemrestriction.c | 22 for (CeedInt i = 0; i < num_elem + 1; i++) x_array[i] = 10 + i; in main() local 26 for (CeedInt i = 0; i < num_elem; i++) { in main() local 27 ind[2 * i + 0] = i; in main() 28 ind[2 * i + 1] = i + 1; in main() 29 curl_orients[3 * 2 * i] = curl_orients[3 * 2 * (i + 1) - 1] = 0; in main() 30 if (i % 2 > 0) { in main() 33 curl_orients[3 * 2 * i + 1] = 0; in main() 34 curl_orients[3 * 2 * i + 2] = -1; in main() 35 curl_orients[3 * 2 * i + 3] = -1; in main() 36 curl_orients[3 * 2 * i + 4] = 0; in main() [all …]
|
| /libCEED/examples/python/qfunctions/ |
| H A D | ex3-volume.h | 26 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass_diff() local 28 q_data[0][i] = w[i] * J[0][0][i]; in build_mass_diff() 31 q_data[1][i] = w[i] / J[0][0][i]; in build_mass_diff() 37 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass_diff() local 40 const CeedScalar J00 = J[0][0][i]; in build_mass_diff() 41 const CeedScalar J10 = J[0][1][i]; in build_mass_diff() 42 const CeedScalar J01 = J[1][0][i]; in build_mass_diff() 43 const CeedScalar J11 = J[1][1][i]; in build_mass_diff() 44 const CeedScalar qw = w[i] / (J00 * J11 - J10 * J01); in build_mass_diff() 47 q_data[0][i] = w[i] * (J00 * J11 - J10 * J01); in build_mass_diff() [all …]
|
| H A D | ex1-volume.h | 25 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { q_data[i] = J[0][0][i] * w[i]; } // End of Quadr… in build_mass() local 31 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass() local 32 q_data[i] = (J[0][0][i] * J[1][1][i] - J[0][1][i] * J[1][0][i]) * w[i]; in build_mass() 39 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass() local 40 q_data[i] = in build_mass() 41 …(J[0][0][i] * (J[1][1][i] * J[2][2][i] - J[1][2][i] * J[2][1][i]) - J[0][1][i] * (J[1][0][i] * J[2… in build_mass() 42 J[0][2][i] * (J[1][0][i] * J[2][1][i] - J[1][1][i] * J[2][0][i])) * in build_mass() 43 w[i]; in build_mass() 58 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { v[i] = q_data[i] * u[i]; } // End of Quadrature … in apply_mass() local
|
| H A D | ex2-surface.h | 26 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { q_data[0][i] = w[i] / J[0][0][i]; } // End of Qu… in build_diff() local 31 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_diff() local 34 const CeedScalar J00 = J[0][0][i]; in build_diff() 35 const CeedScalar J10 = J[0][1][i]; in build_diff() 36 const CeedScalar J01 = J[1][0][i]; in build_diff() 37 const CeedScalar J11 = J[1][1][i]; in build_diff() 38 const CeedScalar qw = w[i] / (J00 * J11 - J10 * J01); in build_diff() 40 q_data[0][i] = qw * (J01 * J01 + J11 * J11); in build_diff() 41 q_data[1][i] = qw * (J00 * J00 + J10 * J10); in build_diff() 42 q_data[2][i] = -qw * (J00 * J01 + J10 * J11); in build_diff() [all …]
|
| /libCEED/examples/ceed/ |
| H A D | ex3-volume.h | 30 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass_diff() local 32 q_data[0][i] = w[i] * J[0][0][i]; in build_mass_diff() 35 q_data[1][i] = w[i] / J[0][0][i]; in build_mass_diff() 41 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass_diff() local 44 const CeedScalar J00 = J[0][0][i]; in build_mass_diff() 45 const CeedScalar J10 = J[0][1][i]; in build_mass_diff() 46 const CeedScalar J01 = J[1][0][i]; in build_mass_diff() 47 const CeedScalar J11 = J[1][1][i]; in build_mass_diff() 48 const CeedScalar qw = w[i] / (J00 * J11 - J10 * J01); in build_mass_diff() 51 q_data[0][i] = w[i] * (J00 * J11 - J10 * J01); in build_mass_diff() [all …]
|
| H A D | ex1-volume-f-c.h | 24 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { q_data[i] = J[0][0][i] * w[i]; } // End of Quadr… in build_mass() local 30 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass() local 31 q_data[i] = (J[0][0][i] * J[1][1][i] - J[0][1][i] * J[1][0][i]) * w[i]; in build_mass() 38 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass() local 39 q_data[i] = in build_mass() 40 …(J[0][0][i] * (J[1][1][i] * J[2][2][i] - J[1][2][i] * J[2][1][i]) - J[0][1][i] * (J[1][0][i] * J[2… in build_mass() 41 J[0][2][i] * (J[1][0][i] * J[2][1][i] - J[1][1][i] * J[2][0][i])) * in build_mass() 42 w[i]; in build_mass() 57 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { v[i] = q_data[i] * u[i]; } // End of Quadrature … in apply_mass() local
|
| H A D | ex1-volume.h | 29 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { q_data[i] = J[0][0][i] * w[i]; } // End of Quadr… in build_mass() local 35 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass() local 36 q_data[i] = (J[0][0][i] * J[1][1][i] - J[0][1][i] * J[1][0][i]) * w[i]; in build_mass() 43 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_mass() local 44 q_data[i] = in build_mass() 45 …(J[0][0][i] * (J[1][1][i] * J[2][2][i] - J[1][2][i] * J[2][1][i]) - J[0][1][i] * (J[1][0][i] * J[2… in build_mass() 46 J[0][2][i] * (J[1][0][i] * J[2][1][i] - J[1][1][i] * J[2][0][i])) * in build_mass() 47 w[i]; in build_mass() 62 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { v[i] = q_data[i] * u[i]; } // End of Quadrature … in apply_mass() local
|
| H A D | ex2-surface.h | 30 …CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { q_data[0][i] = w[i] / J[0][0][i]; } // End of Qu… in build_diff() local 35 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in build_diff() local 38 const CeedScalar J00 = J[0][0][i]; in build_diff() 39 const CeedScalar J10 = J[0][1][i]; in build_diff() 40 const CeedScalar J01 = J[1][0][i]; in build_diff() 41 const CeedScalar J11 = J[1][1][i]; in build_diff() 42 const CeedScalar qw = w[i] / (J00 * J11 - J10 * J01); in build_diff() 44 q_data[0][i] = qw * (J01 * J01 + J11 * J11); in build_diff() 45 q_data[1][i] = qw * (J00 * J00 + J10 * J10); in build_diff() 46 q_data[2][i] = -qw * (J00 * J01 + J10 * J11); in build_diff() [all …]
|
| /libCEED/examples/mfem/ |
| H A D | bp1.h | 26 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { qdata[i] = J[i] * w[i]; } in f_build_mass() local 30 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in f_build_mass() local 33 qdata[i] = (J[i + Q * 0] * J[i + Q * 3] - J[i + Q * 1] * J[i + Q * 2]) * w[i]; in f_build_mass() 38 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in f_build_mass() local 42 qdata[i] = (J[i + Q * 0] * (J[i + Q * 4] * J[i + Q * 8] - J[i + Q * 5] * J[i + Q * 7]) - in f_build_mass() 43 J[i + Q * 1] * (J[i + Q * 3] * J[i + Q * 8] - J[i + Q * 5] * J[i + Q * 6]) + in f_build_mass() 44 J[i + Q * 2] * (J[i + Q * 3] * J[i + Q * 7] - J[i + Q * 4] * J[i + Q * 6])) * in f_build_mass() 45 w[i]; in f_build_mass() 58 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { v[i] = qdata[i] * u[i]; } in f_apply_mass() local
|
| H A D | bp3.h | 28 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { qdata[i] = w[i] / J[i]; } in f_build_diff() local 32 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in f_build_diff() local 35 const CeedScalar J11 = J[i + Q * 0]; in f_build_diff() 36 const CeedScalar J21 = J[i + Q * 1]; in f_build_diff() 37 const CeedScalar J12 = J[i + Q * 2]; in f_build_diff() 38 const CeedScalar J22 = J[i + Q * 3]; in f_build_diff() 39 const CeedScalar qw = w[i] / (J11 * J22 - J21 * J12); in f_build_diff() 40 qdata[i + Q * 0] = qw * (J12 * J12 + J22 * J22); in f_build_diff() 41 qdata[i + Q * 1] = qw * (J11 * J11 + J21 * J21); in f_build_diff() 42 qdata[i + Q * 2] = -qw * (J11 * J12 + J21 * J22); in f_build_diff() [all …]
|
| /libCEED/examples/nek/bps/ |
| H A D | bps.h | 28 for (CeedInt i = 0; i < Q; i++) { in masssetupf() local 29 CeedScalar det = (J[i + Q * 0] * (J[i + Q * 4] * J[i + Q * 8] - J[i + Q * 5] * J[i + Q * 7]) - in masssetupf() 30 J[i + Q * 1] * (J[i + Q * 3] * J[i + Q * 8] - J[i + Q * 5] * J[i + Q * 6]) + in masssetupf() 31 J[i + Q * 2] * (J[i + Q * 3] * J[i + Q * 7] - J[i + Q * 4] * J[i + Q * 6])); in masssetupf() 32 qdata[i] = det * w[i]; in masssetupf() 33 … rhs[i] = qdata[i] * sqrt(x[i] * x[i] + x[i + Q] * x[i + Q] + x[i + 2 * Q] * x[i + 2 * Q]); in masssetupf() 44 for (CeedInt i = 0; i < Q; i++) v[i] = qdata[i] * u[i]; in massf() local 58 for (CeedInt i = 0; i < Q; i++) { in diffsetupf() local 63 const CeedScalar J11 = J[i + Q * 0]; in diffsetupf() 64 const CeedScalar J21 = J[i + Q * 1]; in diffsetupf() [all …]
|
| /libCEED/include/ceed/jit-source/magma/ |
| H A D | magma-common-nontensor.h | 22 int i; in read_A_notrans_g2r_1D_nosync() local 25 for (i = 0; i < P * Q - P * BY; i += P * BY) { in read_A_notrans_g2r_1D_nosync() 26 sA[i + tid] = dA[i + tid]; in read_A_notrans_g2r_1D_nosync() 28 if (i + tid < P * Q) { in read_A_notrans_g2r_1D_nosync() 29 sA[i + tid] = dA[i + tid]; in read_A_notrans_g2r_1D_nosync() 47 int i; in read_A_trans_g2r_1D_nosync() local 50 for (i = 0; i < P * Q - P * BY; i += P * BY) { in read_A_trans_g2r_1D_nosync() 51 sA[i + tid] = dA[i + tid]; in read_A_trans_g2r_1D_nosync() 53 if (i + tid < P * Q) { in read_A_trans_g2r_1D_nosync() 54 sA[i + tid] = dA[i + tid]; in read_A_trans_g2r_1D_nosync() [all …]
|
| /libCEED/examples/petsc/qfunctions/bps/ |
| H A D | bp2.h | 24 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in SetupMassRhs3() local 26 true_soln[i + 0 * Q] = sqrt(x[i] * x[i] + x[i + Q] * x[i + Q] + x[i + 2 * Q] * x[i + 2 * Q]); in SetupMassRhs3() 28 true_soln[i + 1 * Q] = 2 * true_soln[i + 0 * Q]; in SetupMassRhs3() 30 true_soln[i + 2 * Q] = 3 * true_soln[i + 0 * Q]; in SetupMassRhs3() 33 rhs[i + 0 * Q] = w[i] * true_soln[i + 0 * Q]; in SetupMassRhs3() 35 rhs[i + 1 * Q] = 2 * rhs[i + 0 * Q]; in SetupMassRhs3() 37 rhs[i + 2 * Q] = 3 * rhs[i + 0 * Q]; in SetupMassRhs3() 57 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in Mass3() local 59 v[i + 0 * Q] = q_data[i] * u[i + 0 * Q]; in Mass3() 61 v[i + 1 * Q] = q_data[i] * u[i + 1 * Q]; in Mass3() [all …]
|
| H A D | common.h | 17 for (CeedInt i = 0; i < Q; i++) { in Error() local 18 error[i] = (u[i] - target[i]) * (u[i] - target[i]) * q_data[i]; in Error() 27 for (CeedInt i = 0; i < Q; i++) { in Error3() local 28 …error[i + 0 * Q] = (u[i + 0 * Q] - target[i + 0 * Q]) * (u[i + 0 * Q] - target[i + 0 * Q]) * q_dat… in Error3() 29 …error[i + 1 * Q] = (u[i + 1 * Q] - target[i + 1 * Q]) * (u[i + 1 * Q] - target[i + 1 * Q]) * q_dat… in Error3() 30 …error[i + 2 * Q] = (u[i + 2 * Q] - target[i + 2 * Q]) * (u[i + 2 * Q] - target[i + 2 * Q]) * q_dat… in Error3()
|
| H A D | bp24.h | 27 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in SetupMassDiffRhs3() local 32 true_soln[i + 0 * Q] = in SetupMassDiffRhs3() 33 …sin(M_PI * (c[0] + k[0] * x[i + Q * 0])) * sin(M_PI * (c[1] + k[1] * x[i + Q * 1])) * sin(M_PI * (… in SetupMassDiffRhs3() 35 true_soln[i + 1 * Q] = 2 * true_soln[i + 0 * Q]; in SetupMassDiffRhs3() 37 true_soln[i + 2 * Q] = 3 * true_soln[i + 0 * Q]; in SetupMassDiffRhs3() 40 …rhs[i + 0 * Q] = w[i + Q * 0] * (M_PI * M_PI * (k[0] * k[0] + k[1] * k[1] + k[2] * k[2]) + 1.0) * … in SetupMassDiffRhs3() 42 rhs[i + 1 * Q] = 2 * rhs[i + 0 * Q]; in SetupMassDiffRhs3() 44 rhs[i + 2 * Q] = 3 * rhs[i + 0 * Q]; in SetupMassDiffRhs3() 66 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in MassDiff3() local 69 {ug[i + (0 + 0 * 3) * Q], ug[i + (0 + 1 * 3) * Q], ug[i + (0 + 2 * 3) * Q]}, in MassDiff3() [all …]
|
| H A D | bp4.h | 27 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in SetupDiffRhs3() local 32 true_soln[i + 0 * Q] = in SetupDiffRhs3() 33 …sin(M_PI * (c[0] + k[0] * x[i + Q * 0])) * sin(M_PI * (c[1] + k[1] * x[i + Q * 1])) * sin(M_PI * (… in SetupDiffRhs3() 35 true_soln[i + 1 * Q] = 2 * true_soln[i + 0 * Q]; in SetupDiffRhs3() 37 true_soln[i + 2 * Q] = 3 * true_soln[i + 0 * Q]; in SetupDiffRhs3() 40 …rhs[i + 0 * Q] = w[i + Q * 0] * M_PI * M_PI * (k[0] * k[0] + k[1] * k[1] + k[2] * k[2]) * true_sol… in SetupDiffRhs3() 42 rhs[i + 1 * Q] = 2 * rhs[i + 0 * Q]; in SetupDiffRhs3() 44 rhs[i + 2 * Q] = 3 * rhs[i + 0 * Q]; in SetupDiffRhs3() 64 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in Diff3() local 67 {ug[i + (0 + 0 * 3) * Q], ug[i + (0 + 1 * 3) * Q], ug[i + (0 + 2 * 3) * Q]}, in Diff3() [all …]
|
| /libCEED/backends/cuda-ref/ |
| H A D | ceed-cuda-ref-qfunction-load.cpp | 61 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedQFunctionBuildKernel_Cuda_ref() local 62 CeedCallBackend(CeedQFunctionFieldGetSize(input_fields[i], &size)); in CeedQFunctionBuildKernel_Cuda_ref() 63 code << " const CeedInt size_input_" << i << " = " << size << ";\n"; in CeedQFunctionBuildKernel_Cuda_ref() 64 code << " CeedScalar input_" << i << "[size_input_" << i << "];\n"; in CeedQFunctionBuildKernel_Cuda_ref() 67 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedQFunctionBuildKernel_Cuda_ref() local 68 code << " inputs[" << i << "] = input_" << i << ";\n"; in CeedQFunctionBuildKernel_Cuda_ref() 74 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedQFunctionBuildKernel_Cuda_ref() local 75 CeedCallBackend(CeedQFunctionFieldGetSize(output_fields[i], &size)); in CeedQFunctionBuildKernel_Cuda_ref() 76 code << " const CeedInt size_output_" << i << " = " << size << ";\n"; in CeedQFunctionBuildKernel_Cuda_ref() 77 code << " CeedScalar output_" << i << "[size_output_" << i << "];\n"; in CeedQFunctionBuildKernel_Cuda_ref() [all …]
|
| /libCEED/backends/hip-ref/ |
| H A D | ceed-hip-ref-qfunction-load.cpp | 65 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedQFunctionBuildKernel_Hip_ref() local 66 CeedCallBackend(CeedQFunctionFieldGetSize(input_fields[i], &size)); in CeedQFunctionBuildKernel_Hip_ref() 67 code << " const CeedInt size_input_" << i << " = " << size << ";\n"; in CeedQFunctionBuildKernel_Hip_ref() 68 code << " CeedScalar input_" << i << "[size_input_" << i << "];\n"; in CeedQFunctionBuildKernel_Hip_ref() 71 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedQFunctionBuildKernel_Hip_ref() local 72 code << " inputs[" << i << "] = input_" << i << ";\n"; in CeedQFunctionBuildKernel_Hip_ref() 78 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedQFunctionBuildKernel_Hip_ref() local 79 CeedCallBackend(CeedQFunctionFieldGetSize(output_fields[i], &size)); in CeedQFunctionBuildKernel_Hip_ref() 80 code << " const CeedInt size_output_" << i << " = " << size << ";\n"; in CeedQFunctionBuildKernel_Hip_ref() 81 code << " CeedScalar output_" << i << "[size_output_" << i << "];\n"; in CeedQFunctionBuildKernel_Hip_ref() [all …]
|
| /libCEED/examples/solids/qfunctions/ |
| H A D | linear.h | 43 CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { in ElasResidual_Linear() local 46 {ug[0][0][i], ug[1][0][i], ug[2][0][i]}, in ElasResidual_Linear() 47 {ug[0][1][i], ug[1][1][i], ug[2][1][i]}, in ElasResidual_Linear() 48 {ug[0][2][i], ug[1][2][i], ug[2][2][i]} in ElasResidual_Linear() 51 const CeedScalar wdetJ = q_data[0][i]; in ElasResidual_Linear() 53 {q_data[1][i], q_data[2][i], q_data[3][i]}, in ElasResidual_Linear() 54 {q_data[4][i], q_data[5][i], q_data[6][i]}, in ElasResidual_Linear() 55 {q_data[7][i], q_data[8][i], q_data[9][i]} in ElasResidual_Linear() 112 dvdX[k][j][i] = 0; in ElasResidual_Linear() 113 for (CeedInt m = 0; m < 3; m++) dvdX[k][j][i] += dXdx[k][m] * sigma[j][m] * wdetJ; in ElasResidual_Linear() [all …]
|