Lines Matching refs:thread_1d

152 …CeedInt block_sizes[3] = {data->thread_1d, ((!is_tensor || data->dim == 1) ? 1 : data->thread_1d),…  in CeedOperatorApplyAddCore_Hip_gen()
157 CeedInt elems_per_block = 64 * data->thread_1d > 256 ? 256 / data->thread_1d : 64; in CeedOperatorApplyAddCore_Hip_gen()
164 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Hip_gen()
170 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Hip_gen()
176 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Hip_gen()
430 …CeedInt block_sizes[3] = {data->thread_1d, ((!is_tensor || data->dim == 1) ? 1 : data->thread_1d),… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
435 CeedInt elems_per_block = 64 * data->thread_1d > 256 ? 256 / data->thread_1d : 64; in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
442 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
448 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
454 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
616 CeedInt block_sizes[3] = {data->thread_1d, (data->dim == 1 ? 1 : data->thread_1d), -1}; in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
622 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
628 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
634 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
798 CeedInt block_sizes[3] = {data->thread_1d, (data->dim == 1 ? 1 : data->thread_1d), -1}; in CeedOperatorAssembleSingleAtPoints_Hip_gen()
804 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Hip_gen()
810 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Hip_gen()
816 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Hip_gen()