CUTLASS
CUDA Templates for Linear Algebra Subroutines and Solvers
Main Page
Modules
Namespaces
Classes
Files
File List
File Members
include
cutlass
transform
threadblock
regular_tile_access_iterator.h
Go to the documentation of this file.
1
/***************************************************************************************************
2
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
3
*
4
* Redistribution and use in source and binary forms, with or without
5
*modification, are permitted provided that the following conditions are met:
6
* * Redistributions of source code must retain the above copyright notice,
7
*this list of conditions and the following disclaimer.
8
* * Redistributions in binary form must reproduce the above copyright
9
*notice, this list of conditions and the following disclaimer in the
10
*documentation and/or other materials provided with the distribution.
11
* * Neither the name of the NVIDIA CORPORATION nor the names of its
12
*contributors may be used to endorse or promote products derived from this
13
*software without specific prior written permission.
14
*
15
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16
*AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17
*IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18
*DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY DIRECT,
19
*INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
20
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
21
*DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
22
*OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
23
*NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
24
*EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25
*
26
**************************************************************************************************/
32
#pragma once
33
34
#include "
cutlass/cutlass.h
"
35
37
38
namespace
cutlass
{
39
namespace
transform {
40
namespace
threadblock {
41
43
44
template
<
typename
Shape,
typename
Element,
typename
Layout,
int
AdvanceRank,
45
typename
ThreadMap,
46
int
Alignment =
47
sizeof_bits<Element>::value
* ThreadMap::kElementsPerAccess / 8>
48
class
RegularTileAccessIterator
;
49
51
52
}
// namespace threadblock
53
}
// namespace transform
54
}
// namespace cutlass
cutlass
Definition:
aligned_buffer.h:35
cutlass::sizeof_bits::value
static int const value
Definition:
numeric_types.h:43
cutlass::transform::threadblock::RegularTileAccessIterator
Definition:
regular_tile_access_iterator.h:48
cutlass.h
Basic include for CUTLASS.
Generated by
Doxygen 1.8.11