| /petsc/src/sys/objects/device/impls/ |
| H A D | segmentedmempool.hpp | 201 inline PetscErrorCode MemoryChunk<E>::release(const device::StreamBase<U> *stream) noexcept in release() argument 205 stream_id_ = stream->get_id(); in release() 206 PetscCall(stream->record_event(event_)); in release() 223 inline PetscErrorCode MemoryChunk<E>::claim(const device::StreamBase<U> *stream, size_type req_size… in claim() argument 226 if ((*success = can_claim(stream, req_size, serialize))) { in claim() 227 if (serialize && !stream_compat_(stream)) PetscCall(stream->wait_for_event(event_)); in claim() 247 inline bool MemoryChunk<E>::can_claim(const device::StreamBase<U> *stream, size_type req_size, bool… in can_claim() argument 251 if (stream_compat_(stream)) return true; in can_claim() 347 PetscErrorCode MemoryBlock<T, A, S>::clear_(const stream_type *stream) noexcept in clear_() argument 351 PetscCall(allocator_->deallocate(mem_, stream)); in clear_() [all …]
|
| /petsc/include/petsc/private/ |
| H A D | cupmobject.hpp | 272 cupmStream_t *stream = nullptr; in GetFromHandleDispatch_() local 274 PetscCall(PetscDeviceContextGetStreamHandle_Internal(dctx, (void **)&stream)); in GetFromHandleDispatch_() 275 *stream_handle = *stream; in GetFromHandleDispatch_() 281 …x, cupmBlasHandle_t *blas_handle, cupmSolverHandle_t *solver_handle, cupmStream_t *stream) noexcept in GetHandleDispatch_() argument 289 PetscCall(GetFromHandleDispatch_(dctx_loc, blas_handle, solver_handle, stream)); in GetHandleDispatch_() 295 …x, cupmBlasHandle_t *blas_handle, cupmSolverHandle_t *solver_handle, cupmStream_t *stream) noexcept in GetHandles_() argument 297 return GetHandleDispatch_(dctx, blas_handle, solver_handle, stream); in GetHandles_() 301 …GetHandles_(PetscDeviceContext *dctx, cupmBlasHandle_t *blas_handle, cupmStream_t *stream) noexcept in GetHandles_() argument 303 return GetHandleDispatch_(dctx, blas_handle, nullptr, stream); in GetHandles_() 307 …andles_(PetscDeviceContext *dctx, cupmSolverHandle_t *solver_handle, cupmStream_t *stream) noexcept in GetHandles_() argument [all …]
|
| /petsc/src/sys/objects/device/impls/cupm/ |
| H A D | cupmallocator.hpp | 67 …ed_copy(value_type *dest, const value_type *src, size_type n, const StreamBase<U> *stream) noexcept in uninitialized_copy() argument 70 PetscCall(PetscCUPMMemcpyAsync(dest, src, n, cupmMemcpyHostToHost, stream->get_stream(), true)); in uninitialized_copy() 104 …eviceAllocator<T, P>::allocate(value_type **ptr, size_type n, const StreamBase<U> *stream) noexcept in allocate() argument 107 PetscCall(PetscCUPMMallocAsync(ptr, n, stream->get_stream())); in allocate() 113 …cErrorCode DeviceAllocator<T, P>::deallocate(value_type *ptr, const StreamBase<U> *stream) noexcept in deallocate() argument 116 PetscCallCUPM(cupmFreeAsync(ptr, stream->get_stream())); in deallocate() 122 …ode DeviceAllocator<T, P>::zero(value_type *ptr, size_type n, const StreamBase<U> *stream) noexcept in zero() argument 125 PetscCall(PetscCUPMMemsetAsync(ptr, 0, n, stream->get_stream(), true)); in zero() 131 …ed_copy(value_type *dest, const value_type *src, size_type n, const StreamBase<U> *stream) noexcept in uninitialized_copy() argument 134 …PetscCall(PetscCUPMMemcpyAsync(dest, src, n, cupmMemcpyDeviceToDevice, stream->get_stream(), true)… in uninitialized_copy() [all …]
|
| H A D | cupmcontext.hpp | 50 stream_type stream{}; member 68 …PETSC_NODISCARD const cupmStream_t &get(stream_tag) const noexcept { return this->stream.get_strea… in get() 115 PetscCallCUPMBLAS(cupmBlasSetStream(handle, dci->stream.get_stream())); in initialize_handle_() 142 PetscCallCUPMSOLVER(cupmSolverSetStream(handle, dci->stream.get_stream())); in initialize_handle_() 284 PetscCall(dci->stream.destroy()); in destroy() 300 PetscCall(dci->stream.destroy()); in changeStreamType() 315 PetscCall(dci->stream.change_type(dctx->streamType)); in setUp() 328 switch (auto cerr = cupmStreamQuery(impls_cast_(dctx)->stream.get_stream())) { in query() 353 PetscCallCUPM(cupmEventRecord(event, dcib->stream.get_stream())); in waitForContext() 354 PetscCallCUPM(cupmStreamWaitEvent(impls_cast_(dctxa)->stream.get_stream(), event, 0)); in waitForContext() [all …]
|
| /petsc/src/sys/objects/device/tests/output/ |
| H A D | ex6_root_device_context_stream_type-default_hip.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-null_host_no_device.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-null_hip.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_host_with_device.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-nonblocking_cuda.out | 3 stream type: nonblocking 10 stream type: nonblocking 17 stream type: nonblocking 24 stream type: nonblocking 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-null_sycl.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_sycl.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_with_barrier_hip.out | 3 stream type: default_with_barrier 10 stream type: default_with_barrier 17 stream type: default_with_barrier 24 stream type: default_with_barrier 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_with_barrier_host_no_device.out | 3 stream type: default_with_barrier 10 stream type: default_with_barrier 17 stream type: default_with_barrier 24 stream type: default_with_barrier 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-null_cuda.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-null_host_with_device.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-nonblocking_host_no_device.out | 3 stream type: nonblocking 10 stream type: nonblocking 17 stream type: nonblocking 24 stream type: nonblocking 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_with_barrier_host_with_device.out | 3 stream type: default_with_barrier 10 stream type: default_with_barrier 17 stream type: default_with_barrier 24 stream type: default_with_barrier 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-nonblocking_host_with_device.out | 3 stream type: nonblocking 10 stream type: nonblocking 17 stream type: nonblocking 24 stream type: nonblocking 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_host_no_device.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_with_barrier_sycl.out | 3 stream type: default_with_barrier 10 stream type: default_with_barrier 17 stream type: default_with_barrier 24 stream type: default_with_barrier 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-nonblocking_hip.out | 3 stream type: nonblocking 10 stream type: nonblocking 17 stream type: nonblocking 24 stream type: nonblocking 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_cuda.out | 3 stream type: default 10 stream type: default 17 stream type: default 24 stream type: default 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-default_with_barrier_cuda.out | 3 stream type: default_with_barrier 10 stream type: default_with_barrier 17 stream type: default_with_barrier 24 stream type: default_with_barrier 31 stream type: default 38 stream type: default
|
| H A D | ex6_root_device_context_stream_type-nonblocking_sycl.out | 3 stream type: nonblocking 10 stream type: nonblocking 17 stream type: nonblocking 24 stream type: nonblocking 31 stream type: default 38 stream type: default
|
| /petsc/src/mat/impls/dense/seq/cupm/ |
| H A D | matseqdensecupm.hpp | 208 cupmStream_t stream; in SetPreallocation_() local 215 PetscCall(GetHandlesFrom_(dctx, &stream)); in SetPreallocation_() 217 if (!mcu->d_user_alloc) PetscCallCUPM(cupmFreeAsync(mcu->d_v, stream)); in SetPreallocation_() 226 PetscCall(PetscCUPMMallocAsync(&mcu->d_v, size, stream)); in SetPreallocation_() 227 PetscCall(PetscCUPMMemsetAsync(mcu->d_v, 0, size, stream)); in SetPreallocation_() 246 cupmStream_t stream; in HostToDevice_() local 250 PetscCall(GetHandlesFrom_(dctx, &stream)); in HostToDevice_() 259 …tscCall(PetscCUPMMemcpy2DAsync(dest, lda, src, lda, nrows, ncols, cupmMemcpyHostToDevice, stream)); in HostToDevice_() 261 PetscCall(PetscCUPMMemcpyAsync(dest, src, lda * ncols, cupmMemcpyHostToDevice, stream)); in HostToDevice_() 283 cupmStream_t stream; in DeviceToHost_() local [all …]
|