CUTLASS
CUDA Templates for Linear Algebra Subroutines and Solvers
regular_tile_access_iterator.h
Go to the documentation of this file.
1 /***************************************************************************************************
2  * Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
3  *
4  * Redistribution and use in source and binary forms, with or without
5  *modification, are permitted provided that the following conditions are met:
6  * * Redistributions of source code must retain the above copyright notice,
7  *this list of conditions and the following disclaimer.
8  * * Redistributions in binary form must reproduce the above copyright
9  *notice, this list of conditions and the following disclaimer in the
10  *documentation and/or other materials provided with the distribution.
11  * * Neither the name of the NVIDIA CORPORATION nor the names of its
12  *contributors may be used to endorse or promote products derived from this
13  *software without specific prior written permission.
14  *
15  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16  *AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17  *IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18  *DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY DIRECT,
19  *INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
20  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
21  *DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
22  *OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
23  *NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
24  *EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25  *
26  **************************************************************************************************/
32 #pragma once
33 
34 #include "cutlass/cutlass.h"
35 
37 
38 namespace cutlass {
39 namespace transform {
40 namespace threadblock {
41 
43 
44 template <typename Shape, typename Element, typename Layout, int AdvanceRank,
45  typename ThreadMap,
46  int Alignment =
47  sizeof_bits<Element>::value* ThreadMap::kElementsPerAccess / 8>
49 
51 
52 } // namespace threadblock
53 } // namespace transform
54 } // namespace cutlass
Definition: aligned_buffer.h:35
static int const value
Definition: numeric_types.h:43
Definition: regular_tile_access_iterator.h:48
Basic include for CUTLASS.