Lines Matching refs:i

137   for (CeedInt i = 0; i < num_input_fields; i++) {  in CeedOperatorBuildKernel_Sycl_gen()  local
138 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
143 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
162 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
163 CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
168 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
193 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
194 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
196 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
203 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
204 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
206 CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
251 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
252 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
254 code << " global const CeedScalar* d_u_" << i << " = fields->inputs[" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
258 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
259 code << " global CeedScalar* d_v_" << i << " = fields->outputs[" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
272 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
273 code << " // ---- Input field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
275 CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); in CeedOperatorBuildKernel_Sycl_gen()
279 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
283 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
286 code << " const CeedInt P_in_" << i << " = " << P_1d << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
288 code << " const CeedInt P_in_" << i << " = " << Q_1d << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
290 code << " const CeedInt num_comp_in_" << i << " = " << num_comp << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
300 h_B.inputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen()
301 code << " local CeedScalar s_B_in_" << i << "[" << P_1d * Q_1d << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
302 … code << " loadMatrix(P_in_" << i << "*Q_1D, B->inputs[" << i << "], s_B_in_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
306 h_B.inputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen()
307 code << " local CeedScalar s_B_in_" << i << "[" << P_1d * Q_1d << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
308 … code << " loadMatrix(P_in_" << i << "*Q_1D, B->inputs[" << i << "], s_B_in_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
310 h_G.inputs[i] = basis_impl->d_collo_grad_1d; in CeedOperatorBuildKernel_Sycl_gen()
311 code << " local CeedScalar s_G_in_" << i << "[" << Q_1d * Q_1d << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
312 code << " loadMatrix(Q_1D*Q_1D, G->inputs[" << i << "], s_G_in_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
315 … h_G.inputs[i] = has_collo_grad ? basis_impl->d_collo_grad_1d : basis_impl->d_grad_1d; in CeedOperatorBuildKernel_Sycl_gen()
316 …code << " local CeedScalar s_G_in_" << i << "[" << Q_1d * (has_collo_grad ? Q_1d : P_1d) << "];\n… in CeedOperatorBuildKernel_Sycl_gen()
317 …s_collo_grad ? "Q_1D" : ("P_in_" + std::to_string(i))) << "*Q_1D, G->inputs[" << i << "], s_G_in_"… in CeedOperatorBuildKernel_Sycl_gen()
332 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
333 code << " // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
335 CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); in CeedOperatorBuildKernel_Sycl_gen()
339 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
342 CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
345 code << " const CeedInt P_out_" << i << " = " << P_1d << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
347 code << " const CeedInt P_out_" << i << " = " << Q_1d << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
349 code << " const CeedInt num_comp_out_" << i << " = " << num_comp << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
358 h_B.outputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen()
359 code << " local CeedScalar s_B_out_" << i << "[" << P_1d * Q_1d << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
360 … code << " loadMatrix(P_out_" << i << "*Q_1D, B->outputs[" << i << "], s_B_out_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
364 h_B.outputs[i] = basis_impl->d_interp_1d; in CeedOperatorBuildKernel_Sycl_gen()
365 code << " local CeedScalar s_B_out_" << i << "[" << P_1d * Q_1d << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
366 … code << " loadMatrix(P_out_" << i << "*Q_1D, B->outputs[" << i << "], s_B_out_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
368 h_G.outputs[i] = basis_impl->d_collo_grad_1d; in CeedOperatorBuildKernel_Sycl_gen()
369 code << " local CeedScalar s_G_out_" << i << "[" << Q_1d * Q_1d << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
370 code << " loadMatrix(Q_1D*Q_1D, G->outputs[" << i << "], s_G_out_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
373 … h_G.outputs[i] = has_collo_grad ? basis_impl->d_collo_grad_1d : basis_impl->d_grad_1d; in CeedOperatorBuildKernel_Sycl_gen()
374 …code << " local CeedScalar s_G_out_" << i << "[" << Q_1d * (has_collo_grad ? Q_1d : P_1d) << "];\… in CeedOperatorBuildKernel_Sycl_gen()
375 …collo_grad ? "Q_1D" : ("P_out_" + std::to_string(i))) << "*Q_1D, G->outputs[" << i << "], s_G_out_… in CeedOperatorBuildKernel_Sycl_gen()
399 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
400 code << " // ---- Input field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
402 CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); in CeedOperatorBuildKernel_Sycl_gen()
405 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
411 code << " CeedScalar r_u_" << i << "[num_comp_in_" << i << "*P_in_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
418 code << " const CeedInt l_size_in_" << i << " = " << l_size << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
422 h_indices.inputs[i] = rstr_impl->d_offsets; in CeedOperatorBuildKernel_Sycl_gen()
423 …fset" << dim << "d(num_comp_in_" << i << ", " << comp_stride << ", P_in_" << i << ", num_elem, ind… in CeedOperatorBuildKernel_Sycl_gen()
424 << "], d_u_" << i << ", r_u_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
437 …code << " readDofsStrided" << dim << "d(num_comp_in_" << i << ",P_in_" << i << "," << strides[0… in CeedOperatorBuildKernel_Sycl_gen()
438 << ", num_elem, d_u_" << i << ", r_u_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
448 code << " private CeedScalar* r_t_" << i << " = r_u_" << i << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
452 code << " CeedScalar r_t_" << i << "[num_comp_in_" << i << "*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
453 …"Tensor" : "") << dim << "d(num_comp_in_" << i << ", P_in_" << i << ", Q_1D, r_u_" << i << ", s_B_… in CeedOperatorBuildKernel_Sycl_gen()
454 << ", r_t_" << i << ", elem_scratch);\n"; in CeedOperatorBuildKernel_Sycl_gen()
458 code << " CeedScalar r_t_" << i << "[num_comp_in_" << i << "*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
459 …dim > 1 ? "Tensor" : "") << dim << "d(num_comp_in_" << i << ", P_in_" << i << ", Q_1D, r_u_" << i in CeedOperatorBuildKernel_Sycl_gen()
460 << i << ", r_t_" << i << ", elem_scratch);\n"; in CeedOperatorBuildKernel_Sycl_gen()
464 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
466 code << " CeedScalar r_t_" << i << "[num_comp_in_" << i << "*DIM*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
467 … ? "Tensor" : "") << (dim == 3 && Q_1d >= P_1d ? "Collocated" : "") << dim << "d(num_comp_in_" << i in CeedOperatorBuildKernel_Sycl_gen()
468 …<< ", P_in_" << i << ", Q_1D, r_u_" << i << (dim > 1 ? ", s_B_in_" : "") << (dim > 1 ? std::to_str… in CeedOperatorBuildKernel_Sycl_gen()
469 << ", r_t_" << i << ", elem_scratch);\n"; in CeedOperatorBuildKernel_Sycl_gen()
474 code << " CeedScalar r_t_" << i << "[Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
475 CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
478 … code << " Weight" << (dim > 1 ? "Tensor" : "") << dim << "d(Q_1D, W, r_t_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
490 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
491 code << "\n // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
492 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
496 code << " CeedScalar r_tt_" << i << "[num_comp_out_" << i << "*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
497 code << " for (CeedInt i = 0; i < num_comp_out_" << i << "; i++) {\n"; in CeedOperatorBuildKernel_Sycl_gen()
499 code << " r_tt_" << i << "[j + i*Q_1D] = 0.0;\n"; in CeedOperatorBuildKernel_Sycl_gen()
503 code << " CeedScalar r_tt_" << i << "[num_comp_out_" << i << "*DIM*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
507 code << " CeedScalar r_tt_" << i << "[num_comp_out_" << i << "*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
515 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
516 code << " // ---- Input field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
518 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
525 code << " CeedScalar r_q_" << i << "[num_comp_in_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
527 CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); in CeedOperatorBuildKernel_Sycl_gen()
533 code << " const CeedInt l_size_in_" << i << " = " << l_size << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
537 h_indices.inputs[i] = rstr_impl->d_offsets; in CeedOperatorBuildKernel_Sycl_gen()
539 …<< "3d(num_comp_in_" << i << ", " << comp_stride << ", Q_1D, l_size_in_" << i << ", num_elem, q, i… in CeedOperatorBuildKernel_Sycl_gen()
540 << i << ", r_q_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
555 …<< "3d(num_comp_in_" << i << ", Q_1D," << strides[0] << ", " << strides[1] << ", " << strides[2] <… in CeedOperatorBuildKernel_Sycl_gen()
556 << ", r_q_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
561 code << " CeedScalar r_q_" << i << "[num_comp_in_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
562 code << " for (CeedInt j = 0; j < num_comp_in_" << i << " ; ++j) {\n"; in CeedOperatorBuildKernel_Sycl_gen()
563 code << " r_q_" << i << "[j] = r_t_" << i << "[q + j*Q_1D];\n"; in CeedOperatorBuildKernel_Sycl_gen()
567 code << " CeedScalar r_q_" << i << "[num_comp_in_" << i << "*DIM];\n"; in CeedOperatorBuildKernel_Sycl_gen()
568 …code << " gradCollo3d(num_comp_in_" << i << ", Q_1D, q, r_t_" << i << ", s_G_in_" << i << ", … in CeedOperatorBuildKernel_Sycl_gen()
571 code << " CeedScalar r_q_" << i << "[1];\n"; in CeedOperatorBuildKernel_Sycl_gen()
572 code << " r_q_" << i << "[0] = r_t_" << i << "[q];\n"; in CeedOperatorBuildKernel_Sycl_gen()
581 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
582 code << " // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
583 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
587 code << " CeedScalar r_qq_" << i << "[num_comp_out_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
590 code << " CeedScalar r_qq_" << i << "[num_comp_out_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
593 code << " CeedScalar r_qq_" << i << "[num_comp_out_" << i << "*DIM];\n"; in CeedOperatorBuildKernel_Sycl_gen()
606 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
607 code << " // ---- Input field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
608 code << " private CeedScalar* r_q_" << i << " = r_t_" << i << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
611 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
612 code << " // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
613 code << " private CeedScalar* r_qq_" << i << " = r_tt_" << i << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
619 for (CeedInt i = 0; i < num_input_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
620 code << " // ---- Input field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
621 code << " in[" << i << "] = r_q_" << i << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
624 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
625 code << " // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
626 code << " out[" << i << "] = r_qq_" << i << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
641 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
642 code << " // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
643 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
648 code << " for (CeedInt j = 0; j < num_comp_out_" << i << " ; ++j) {\n"; in CeedOperatorBuildKernel_Sycl_gen()
649 code << " r_tt_" << i << "[q + j*Q_1D] = r_qq_" << i << "[j];\n"; in CeedOperatorBuildKernel_Sycl_gen()
653 code << " for (CeedInt j = 0; j < num_comp_out_" << i << " ; ++j) {\n"; in CeedOperatorBuildKernel_Sycl_gen()
654 code << " r_tt_" << i << "[q + j*Q_1D] = r_qq_" << i << "[j];\n"; in CeedOperatorBuildKernel_Sycl_gen()
658 … gradColloTranspose3d(num_comp_out_" << i << ",Q_1D, q, r_qq_" << i << ", s_G_out_" << i << ", … in CeedOperatorBuildKernel_Sycl_gen()
675 for (CeedInt i = 0; i < num_output_fields; i++) { in CeedOperatorBuildKernel_Sycl_gen() local
676 code << " // ---- Output field " << i << " ----\n"; in CeedOperatorBuildKernel_Sycl_gen()
678 CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); in CeedOperatorBuildKernel_Sycl_gen()
681 CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); in CeedOperatorBuildKernel_Sycl_gen()
686 code << " private CeedScalar* r_v_" << i << " = r_tt_" << i << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
689 code << " CeedScalar r_v_" << i << "[num_comp_out_" << i << "*P_out_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
690 …dim > 1 ? "Tensor" : "") << dim << "d(num_comp_out_" << i << ",P_out_" << i << ", Q_1D, r_tt_" << i in CeedOperatorBuildKernel_Sycl_gen()
691 << ", s_B_out_" << i << ", r_v_" << i << ", elem_scratch);\n"; in CeedOperatorBuildKernel_Sycl_gen()
694 code << " CeedScalar r_v_" << i << "[num_comp_out_" << i << "*P_out_" << i << "];\n"; in CeedOperatorBuildKernel_Sycl_gen()
696 …dim > 1 ? "Tensor" : "") << dim << "d(num_comp_out_" << i << ",P_out_" << i << ", Q_1D, r_tt_" << i in CeedOperatorBuildKernel_Sycl_gen()
697 << ", s_B_out_" << i << ", r_v_" << i << ", elem_scratch);\n"; in CeedOperatorBuildKernel_Sycl_gen()
700 CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); in CeedOperatorBuildKernel_Sycl_gen()
702 …? "Tensor" : "") << (dim == 3 && Q_1d >= P_1d ? "Collocated" : "") << dim << "d(num_comp_out_" << i in CeedOperatorBuildKernel_Sycl_gen()
703 …<< ", P_out_" << i << ", Q_1D, r_tt_" << i << (dim > 1 ? ", s_B_out_" : "") << (dim > 1 ? std::to_… in CeedOperatorBuildKernel_Sycl_gen()
704 << ", r_v_" << i << ", elem_scratch);\n"; in CeedOperatorBuildKernel_Sycl_gen()
728 code << " const CeedInt l_size_out_" << i << " = " << l_size << ";\n"; in CeedOperatorBuildKernel_Sycl_gen()
732 h_indices.outputs[i] = rstr_impl->d_offsets; in CeedOperatorBuildKernel_Sycl_gen()
733 …et" << dim << "d(num_comp_out_" << i << ", " << comp_stride << ", P_out_" << i << ", num_elem, ind… in CeedOperatorBuildKernel_Sycl_gen()
734 << "], r_v_" << i << ", d_v_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()
747 …code << " writeDofsStrided" << dim << "d(num_comp_out_" << i << ",P_out_" << i << "," << stride… in CeedOperatorBuildKernel_Sycl_gen()
748 << ", num_elem, r_v_" << i << ", d_v_" << i << ");\n"; in CeedOperatorBuildKernel_Sycl_gen()