include/cuda/experimental/__stream/stream.cuh
File members: include/cuda/experimental/__stream/stream.cuh
//===----------------------------------------------------------------------===//
//
// Part of CUDA Experimental in CUDA C++ Core Libraries,
// under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
// SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES.
//
//===----------------------------------------------------------------------===//
#ifndef _CUDAX__STREAM_STREAM
#define _CUDAX__STREAM_STREAM
#include <cuda/std/detail/__config>
#include <cuda_runtime_api.h>
#if defined(_CCCL_IMPLICIT_SYSTEM_HEADER_GCC)
# pragma GCC system_header
#elif defined(_CCCL_IMPLICIT_SYSTEM_HEADER_CLANG)
# pragma clang system_header
#elif defined(_CCCL_IMPLICIT_SYSTEM_HEADER_MSVC)
# pragma system_header
#endif // no system header
#include <cuda/std/__cuda/api_wrapper.h>
#include <cuda/experimental/__device/device_ref.cuh>
#include <cuda/experimental/__device/logical_device.cuh>
#include <cuda/experimental/__stream/stream_ref.cuh>
#include <cuda/experimental/__utility/ensure_current_device.cuh>
namespace cuda::experimental
{
struct stream : stream_ref
{
// 0 is documented as default priority
static constexpr int default_priority = 0;
explicit stream(device_ref __dev, int __priority = default_priority)
: stream_ref(detail::__invalid_stream)
{
[[maybe_unused]] __ensure_current_device __dev_setter(__dev);
_CCCL_TRY_CUDA_API(
::cudaStreamCreateWithPriority, "Failed to create a stream", &__stream, cudaStreamNonBlocking, __priority);
}
explicit stream(::cuda::experimental::logical_device __dev, int __priority = default_priority)
: stream_ref(detail::__invalid_stream)
{
[[maybe_unused]] __ensure_current_device __dev_setter(__dev);
_CCCL_TRY_CUDA_API(
::cudaStreamCreateWithPriority, "Failed to create a stream", &__stream, cudaStreamNonBlocking, __priority);
}
stream()
: stream(device_ref{0})
{}
// Can't be constexpr because __invalid_stream isn't
explicit stream(uninit_t) noexcept
: stream_ref(detail::__invalid_stream)
{}
stream(stream&& __other) noexcept
: stream(_CUDA_VSTD::exchange(__other.__stream, detail::__invalid_stream))
{}
stream(const stream&) = delete;
~stream()
{
if (__stream != detail::__invalid_stream)
{
// Needs to call driver API in case current device is not set, runtime version would set dev 0 current
// Alternative would be to store the device and push/pop here
[[maybe_unused]] auto status = detail::driver::streamDestroy(__stream);
}
}
stream& operator=(stream&& __other) noexcept
{
stream __tmp(_CUDA_VSTD::move(__other));
_CUDA_VSTD::swap(__stream, __tmp.__stream);
return *this;
}
stream& operator=(const stream&) = delete;
_CCCL_NODISCARD static stream from_native_handle(::cudaStream_t __handle)
{
return stream(__handle);
}
// Disallow construction from an `int`, e.g., `0`.
static stream from_native_handle(int) = delete;
// Disallow construction from `nullptr`.
static stream from_native_handle(_CUDA_VSTD::nullptr_t) = delete;
_CCCL_NODISCARD ::cudaStream_t release()
{
return _CUDA_VSTD::exchange(__stream, detail::__invalid_stream);
}
private:
// Use `stream::from_native_handle(s)` to construct an owning `stream`
// object from a `cudaStream_t` handle.
explicit stream(::cudaStream_t __handle)
: stream_ref(__handle)
{}
};
} // namespace cuda::experimental
#endif // _CUDAX__STREAM_STREAM