|
using | Shape = Shape_ |
|
using | ThreadShape = ThreadShape_ |
|
using | LayoutA = LayoutA_ |
|
using | LayoutB = LayoutB_ |
|
using | LayoutC = LayoutC_ |
|
using | ElementA = ElementA_ |
|
using | ElementB = ElementB_ |
|
using | ElementC = ElementC_ |
|
using | IteratorPolicyA = typename platform::conditional< platform::is_same< LayoutA, layout::RowMajor >::value, cutlass::transform::PitchLinearTilePolicyStripminedThreadContiguous< layout::PitchLinearShape< Shape::kK, Shape::kM >, 1, ThreadShape::kK >, cutlass::transform::PitchLinearTilePolicyStripminedThreadStrided< layout::PitchLinearShape< Shape::kM, Shape::kK >, 1, ThreadShape::kM >>::type |
|
using | IteratorA = cutlass::transform::threadblock::PredicatedTileIterator< cutlass::MatrixShape< Shape::kM, Shape::kK >, ElementA, LayoutA, 1, IteratorPolicyA > |
|
using | IteratorPolicyB = typename platform::conditional< platform::is_same< LayoutB, layout::RowMajor >::value, cutlass::transform::PitchLinearTilePolicyStripminedThreadContiguous< layout::PitchLinearShape< Shape::kN, Shape::kK >, kThreadsPerN, ThreadShape::kN >, cutlass::transform::PitchLinearTilePolicyStripminedThreadStrided< layout::PitchLinearShape< Shape::kK, Shape::kN >, kThreadsPerN, ThreadShape::kK >>::type |
|
using | IteratorB = cutlass::transform::threadblock::PredicatedTileIterator< cutlass::MatrixShape< Shape::kK, Shape::kN >, ElementB, LayoutB, 0, IteratorPolicyB > |
|
using | IteratorPolicyC = typename platform::conditional< platform::is_same< LayoutC, layout::RowMajor >::value, cutlass::transform::PitchLinearTilePolicyStripminedThreadContiguous< layout::PitchLinearShape< Shape::kN, Shape::kM >, kThreadsPerN, ThreadShape::kN >, cutlass::transform::PitchLinearTilePolicyStripminedThreadStrided< layout::PitchLinearShape< Shape::kM, Shape::kN >, kThreadsPerN, ThreadShape::kM >>::type |
|
using | IteratorC = cutlass::transform::threadblock::PredicatedTileIterator< cutlass::MatrixShape< Shape::kM, Shape::kN >, ElementC, LayoutC, 0, IteratorPolicyC > |
|
using | MmaSimtOp = typename cutlass::gemm::thread::Mma< cutlass::gemm::GemmShape< ThreadShape::kM, ThreadShape::kN, Shape::kK >, ElementA, LayoutA, ElementB, LayoutB, ElementC, LayoutC > |
|
using | Operator = MmaSimtOp |
|
template<typename Shape_, typename ThreadShape_, typename ElementA_, typename LayoutA_, typename ElementB_, typename LayoutB_, typename ElementC_, typename LayoutC_>
struct cutlass::gemm::threadblock::DefaultGemvCore< Shape_, ThreadShape_, ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, LayoutC_ >
Template defining default vector-matrix multiply operators inferred from threadblock tile size and global memory data layout.