cuda::experimental::places::exec_place_device#

class exec_place_device : public cuda::experimental::places::exec_place #

Designates execution that is to run on a specific CUDA device.

A device is modeled as a 1-element grid containing only that device.

Public Functions

template<typename T> inline ::std::shared_ptr<impl> make_static_instance( )#

inline bool operator==(const exec_place &rhs) const#

inline bool operator!=(const exec_place &rhs) const#

inline bool operator<(const exec_place &rhs) const#

inline bool operator>(const exec_place &rhs) const#

inline bool operator<=(const exec_place &rhs) const#

inline bool operator>=(const exec_place &rhs) const#

inline size_t hash() const#

inline dim4 get_dims() const#

Get the dimensions of this grid.

For scalar places (host, single device), returns dim4(1, 1, 1, 1).

inline size_t size() const#

Get the total number of places in this grid.

inline exec_place get_place(size_t idx) const#

Get the sub-place at the given linear index.

For scalar places, idx must be 0, and the place itself is returned.

inline exec_place get_place(pos4 p) const#

Get the sub-place at the given multi-dimensional position.

inline exec_place reshape(const dim4 &dims) const#

Return a grid with new dimensions and the same linear place order.

The product of dims must equal size(), and every extent must be positive. This changes only the coordinate system: for every linear index i, result.get_place(i) == get_place(i).

Parameters:

dims – [in] New grid dimensions

Returns:

A grid over the same places with dimensions dims

inline exec_place collapse_axes( const size_t first_axis, const size_t last_axis ) const#

Collapse a contiguous inclusive range of grid axes.

Axes in [first_axis, last_axis] are replaced by one axis whose extent is their product. Later axes shift left and trailing extents become one. Linear place order is preserved.

Parameters:

first_axis – [in] First axis to collapse (inclusive)
last_axis – [in] Last axis to collapse (inclusive)

Returns:

A grid over the same places with the selected axes collapsed

inline exec_place_scope activate(size_t idx = 0) const#

Activate the sub-place at the given index.

Returns an exec_place_scope RAII guard that automatically deactivates when destroyed. For scalar places, idx should be 0 (the default).

Parameters:

idx – The index of the sub-place to activate (default 0 for scalar places)

Returns:

An exec_place_scope guard that manages the activation lifetime

inline ::std::string to_string() const#

inline data_place affine_data_place() const#

inline void set_affine_data_place(data_place place)#

inline stream_pool &get_stream_pool( bool for_computation, exec_place_resources &res ) const#

Get the stream pool associated with this place from the supplied registry.

Pooled places (device, host) lazily create their entry in res; self-contained places (cuda_stream, green-context) ignore res and return their embedded pool.

inline stream_pool &get_stream_pool( bool for_computation, ::cuda::experimental::stf::async_resources_handle &h ) const#