Lines Matching refs:block_sizes
152 …CeedInt block_sizes[3] = {data->thread_1d, ((!is_tensor || data->dim == 1) ? 1 : data->thread_1d),… in CeedOperatorApplyAddCore_Hip_gen() local
155 …lBackend(BlockGridCalculate_Hip_gen(data->dim, num_elem, data->max_P_1d, data->Q_1d, block_sizes)); in CeedOperatorApplyAddCore_Hip_gen()
160 block_sizes[2] = elems_per_block; in CeedOperatorApplyAddCore_Hip_gen()
163 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorApplyAddCore_Hip_gen()
164 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Hip_gen()
166 …ryRunKernelDimShared_Hip(ceed, data->op, stream, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorApplyAddCore_Hip_gen()
169 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorApplyAddCore_Hip_gen()
170 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Hip_gen()
172 …ryRunKernelDimShared_Hip(ceed, data->op, stream, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorApplyAddCore_Hip_gen()
175 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorApplyAddCore_Hip_gen()
176 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorApplyAddCore_Hip_gen()
178 …ryRunKernelDimShared_Hip(ceed, data->op, stream, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorApplyAddCore_Hip_gen()
430 …CeedInt block_sizes[3] = {data->thread_1d, ((!is_tensor || data->dim == 1) ? 1 : data->thread_1d),… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen() local
433 …lBackend(BlockGridCalculate_Hip_gen(data->dim, num_elem, data->max_P_1d, data->Q_1d, block_sizes)); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
438 block_sizes[2] = elems_per_block; in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
441 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
442 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
444 …Shared_Hip(ceed, data->assemble_qfunction, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
447 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
448 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
450 …Shared_Hip(ceed, data->assemble_qfunction, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
453 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
454 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
456 …Shared_Hip(ceed, data->assemble_qfunction, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorLinearAssembleQFunctionCore_Hip_gen()
616 CeedInt block_sizes[3] = {data->thread_1d, (data->dim == 1 ? 1 : data->thread_1d), -1}; in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen() local
618 …lBackend(BlockGridCalculate_Hip_gen(data->dim, num_elem, data->max_P_1d, data->Q_1d, block_sizes)); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
619 block_sizes[2] = 1; in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
621 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
622 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
624 …mShared_Hip(ceed, data->assemble_diagonal, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
627 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
628 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
630 …mShared_Hip(ceed, data->assemble_diagonal, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
633 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
634 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
636 …mShared_Hip(ceed, data->assemble_diagonal, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorLinearAssembleAddDiagonalAtPoints_Hip_gen()
798 CeedInt block_sizes[3] = {data->thread_1d, (data->dim == 1 ? 1 : data->thread_1d), -1}; in CeedOperatorAssembleSingleAtPoints_Hip_gen() local
800 …lBackend(BlockGridCalculate_Hip_gen(data->dim, num_elem, data->max_P_1d, data->Q_1d, block_sizes)); in CeedOperatorAssembleSingleAtPoints_Hip_gen()
801 block_sizes[2] = 1; in CeedOperatorAssembleSingleAtPoints_Hip_gen()
803 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorAssembleSingleAtPoints_Hip_gen()
804 CeedInt sharedMem = block_sizes[2] * data->thread_1d * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Hip_gen()
806 …elDimShared_Hip(ceed, data->assemble_full, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorAssembleSingleAtPoints_Hip_gen()
809 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorAssembleSingleAtPoints_Hip_gen()
810 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Hip_gen()
812 …elDimShared_Hip(ceed, data->assemble_full, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorAssembleSingleAtPoints_Hip_gen()
815 …CeedInt grid = num_elem / block_sizes[2] + ((num_elem / block_sizes[2] * block_sizes[2] < num… in CeedOperatorAssembleSingleAtPoints_Hip_gen()
816 CeedInt sharedMem = block_sizes[2] * data->thread_1d * data->thread_1d * sizeof(CeedScalar); in CeedOperatorAssembleSingleAtPoints_Hip_gen()
818 …elDimShared_Hip(ceed, data->assemble_full, NULL, grid, block_sizes[0], block_sizes[1], block_sizes… in CeedOperatorAssembleSingleAtPoints_Hip_gen()