Home
last modified time | relevance | path

Searched refs:kernels (Results 1 – 25 of 25) sorted by relevance

/petsc/src/vec/is/sf/impls/basic/cupm/
H A Dsfcupm_impl.hpp16 namespace kernels namespace
62 ::Petsc::device::cupm::kernels::util::grid_stride_1D(count, [&](PetscInt tid) { in d_Pack()
75 ::Petsc::device::cupm::kernels::util::grid_stride_1D(count, [&](PetscInt tid) { in d_UnpackAndOp()
88 ::Petsc::device::cupm::kernels::util::grid_stride_1D(count, [&](PetscInt tid) { in d_FetchAndOp()
101 ::Petsc::device::cupm::kernels::util::grid_stride_1D(count, [&](PetscInt tid) { in d_ScatterAndOp()
136 ::Petsc::device::cupm::kernels::util::grid_stride_1D(count, [&](PetscInt tid) { in d_FetchAndOpLocal()
285 …PetscCall(PetscCUPMLaunchKernel1D(count, 0, link->stream, kernels::d_Pack<Type, BS, EQ>, link->bs,… in Pack()
298 …if (PetscDefined(USING_NVCC) && std::is_same<Op, kernels::Insert<Type>>::value && !opt && !idx) { … in UnpackAndOp()
301 …PetscCall(PetscCUPMLaunchKernel1D(count, 0, link->stream, kernels::d_UnpackAndOp<Type, Op, BS, EQ>… in UnpackAndOp()
314 …PetscCall(PetscCUPMLaunchKernel1D(count, 0, link->stream, kernels::d_FetchAndOp<Type, Op, BS, EQ>,… in FetchAndOp()
[all …]
/petsc/src/vec/vec/impls/mpi/cupm/
H A Dvecmpicupm_impl.hpp270 namespace kernels namespace
278 …Petsc::device::cupm::kernels::util::grid_stride_1D(nnz, [=](PetscCount i) { buf[i] = vv[perm[i]]; … in pack_coo_values()
346 …PetscCall(PetscCUPMLaunchKernel1D(sendlen, 0, stream, kernels::pack_coo_values, vv, sendlen, vcu->… in SetValuesCOO()
354 …if (const auto n = x->map->n) PetscCall(PetscCUPMLaunchKernel1D(n, 0, stream, kernels::add_coo_val… in SetValuesCOO()
359 …if (const auto nnz2 = vmpi->nnz2) PetscCall(PetscCUPMLaunchKernel1D(nnz2, 0, stream, kernels::add_… in SetValuesCOO()
/petsc/doc/changes/
H A D231.md9 - Added supported for IBM BGL with optimzed fortran kernels
61 - Changed --with-fortran-kernels=\<0,1> option to
62 --with-fortran-kernels=\<none,generic,bgl>
H A D39.md18 - Added --with-avx512-kernels to specify that hand-coded kernels
H A D312.md22 - The ./configure option --with-avx512-kernels defaults to true now
23 so the manually optimized AVX-512 kernels are used by default
H A D314.md54 example, one can use '--download-kokkos --download-kokkos-kernels
58 Kokkos kernels. Currently, VECKOKKOS supports all vector
H A D322.md18 - Add `--with-openmp-kernels`
H A D34.md157 - Added support to deal with linear systems with non-trivial kernels
H A D321.md103 - Add `MATSELLHIP` and the corresponding HIP kernels for matrix-vector multiplication
/petsc/src/sys/objects/device/impls/cupm/
H A Dkernels.hpp14 namespace kernels namespace
/petsc/src/vec/vec/impls/seq/cupm/
H A Dvecseqcupm.hpp139 namespace kernels namespace
145 ::Petsc::device::cupm::kernels::util::grid_stride_1D(n, [=](PetscCount i) { in add_coo_values_impl()
H A Dvecseqcupm_impl.hpp853 namespace kernels namespace
869 ::Petsc::device::cupm::kernels::util::grid_stride_1D(size, [&](PetscInt i) { in MAXPY_kernel()
914 kernels::MAXPY_kernel<typename detail::repeat_type<const PetscScalar *, Idx>::type...>, in MAXPY_kernel_dispatch_()
1035 namespace kernels namespace
1116 ::Petsc::device::cupm::kernels::util::grid_stride_1D(size, [&](PetscInt i) { in sum_kernel()
1126 ::Petsc::device::cupm::kernels::util::grid_stride_1D(size, [&](PetscInt i) { in sum_kernel()
1160 kernels::MDot_kernel<typename detail::repeat_type<const PetscScalar *, Idx>::type...>, in MDot_kernel_dispatch_()
1253 PetscCall(PetscCUPMLaunchKernel1D(nv, 0, stream, kernels::sum_kernel, nv, d_results)); in MDot_()
2268 …PetscCall(PetscCUPMLaunchKernel1D(n, 0, stream, kernels::add_coo_values, vv, n, vcu->jmap1_d, vcu-… in SetValuesCOO()
/petsc/doc/install/
H A Dexternal_software.md14 - [BLAS/LAPACK](https://www.netlib.org/lapack/lug/node11.html) Optimizes linear algebra kernels (al…
H A Dinstall.md286 These packages provide some basic numeric kernels used by PETSc. `configure` will
655 Use `--with-openmp-kernels` to have some PETSc numerical routines use OpenMP to speed up their comp…
686 … most cases you need only pass the configure option `--download-kokkos` `--download-kokkos-kernels`
/petsc/src/snes/tutorials/output/
H A Dex19_tut_6.out122 Compiled without FORTRAN kernels
H A Dex19_tut_4.out117 Compiled without FORTRAN kernels
H A Dex19_tut_5.out126 Compiled without FORTRAN kernels
H A Dex19_tut_7.out135 Compiled without FORTRAN kernels
/petsc/doc/developers/
H A Dmatrices.md97 sequential kernels in PETSc can dramatically improve overall floating
/petsc/doc/manual/
H A Dgetting_started.md622 The ./configure option `--with-openmp-kernels` causes some PETSc numerical kernels to be compiled u…
643 …open-source package that provides a slightly higher-level programming model to utilize GPU kernels.
645 …r `--with-hip` and, if they plan to use Kokkos, also `--download-kokkos --download-kokkos-kernels`.
H A Dprofiling.md680 lets you see a timeline of code performance information like kernels,
H A Dvec.md573 … number of `*`. This allows one to write very natural Kokkos multi-dimensional parallel for kernels
/petsc/doc/community/meetings/2025/
H A Dindex.md182 … automates the generation of highly optimized explicit finite-difference kernels and stencil compu…
214 …-specific language that automates the application of local computational kernels over a mesh, term…
/petsc/doc/community/meetings/2023/
H A Dindex.md182 kernels libraries with PETSc on modern architectures.
/petsc/doc/tutorials/physics/
H A Dguide_to_stokes.md57 …s. The entire scheme is detailed in {cite}`knepleybrownruppsmith13`. The kernels paired with test …