40 template <
typename Func,
int Rank,
int RankRemaining>
52 for (
int i = 0; i < extent.
at(kActiveRank); ++i) {
60 template <
typename Func,
int Rank>
72 for (
int i = 0; i < extent.
at(kActiveRank); ++i) {
105 template <
typename Element,
typename Func>
112 typename Func::Params params =
typename Func::Params()) {
116 for (
size_t index = 0; index < capacity; ++index) {
Definition: host/tensor_foreach.h:106
Definition: aligned_buffer.h:35
BlockForEach(Element *ptr, size_t capacity, typename Func::Params params=typename Func::Params())
Constructor performs the operation.
Definition: host/tensor_foreach.h:109
static int const kActiveRank
Index of the active rank.
Definition: host/tensor_foreach.h:44
TensorForEachHelper(Func &func, Coord< Rank > const &extent, Coord< Rank > &coord)
Constructor for general rank.
Definition: host/tensor_foreach.h:47
Helper to perform a for-each operation.
Definition: host/tensor_foreach.h:41
TensorForEachHelper(Func &func, Coord< Rank > const &extent, Coord< Rank > &coord)
Constructor for fastest changing rank.
Definition: host/tensor_foreach.h:67
Statically-sized array specifying Coords within a tensor.
Definition: coord.h:43
void TensorForEachLambda(Coord< Rank > extent, Func func)
Iterates over the index space of a tensor and calls a C++ lambda.
Definition: host/tensor_foreach.h:98
void TensorForEach(Coord< Rank > extent, Func &func)
Iterates over the index space of a tensor.
Definition: host/tensor_foreach.h:87
CUTLASS_HOST_DEVICE Index & at()
Gets the index of a given Coord element.
Definition: coord.h:255
Basic include for CUTLASS.