CUTLASS
CUDA Templates for Linear Algebra Subroutines and Solvers
Classes | Namespaces
mma_sm75.h File Reference

Matrix multiply for SM75. More...

#include <assert.h>
#include "cutlass/arch/wmma.h"
#include "cutlass/arch/mma.h"
#include "cutlass/layout/matrix.h"
#include "cutlass/numeric_types.h"
Include dependency graph for mma_sm75.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Classes

struct  cutlass::arch::Mma< gemm::GemmShape< 16, 8, 8 >, 32, half_t, layout::RowMajor, half_t, layout::ColumnMajor, half_t, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: F16 = F16 * F16 + F16. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 16, 8, 8 >, 32, half_t, layout::RowMajor, half_t, layout::ColumnMajor, float, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: F32 = F16 * F16 + F32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = S8 * S8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, uint8_t, layout::RowMajor, int8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = U8 * S8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, int8_t, layout::RowMajor, uint8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = S8 * U8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, uint8_t, layout::RowMajor, uint8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = U8 * U8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = S8 * S8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, uint8_t, layout::RowMajor, int8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = U8 * S8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, int8_t, layout::RowMajor, uint8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = S8 * U8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 16 >, 32, uint8_t, layout::RowMajor, uint8_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = U8 * U8 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, int4b_t, layout::RowMajor, int4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = S4 * S4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, uint4b_t, layout::RowMajor, int4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = U4 * S4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, int4b_t, layout::RowMajor, uint4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = S4 * U4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, uint4b_t, layout::RowMajor, uint4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAdd >
 Matrix multiply-add operation: S32 = U4 * U4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, int4b_t, layout::RowMajor, int4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = S4 * S4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, uint4b_t, layout::RowMajor, int4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = U4 * S4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, int4b_t, layout::RowMajor, uint4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = S4 * U4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 32 >, 32, uint4b_t, layout::RowMajor, uint4b_t, layout::ColumnMajor, int, layout::RowMajor, OpMultiplyAddSaturate >
 Matrix multiply-add operation: S32 = U4 * U4 + S32. More...
 
struct  cutlass::arch::Mma< gemm::GemmShape< 8, 8, 128 >, 32, uint1b_t, layout::RowMajor, uint1b_t, layout::ColumnMajor, int, layout::RowMajor, OpXorPopc >
 Matrix multiply-add operation: S32 = B1 ^ B1 + S32 (XOR followed by population count). More...
 

Namespaces

 cutlass
 
 cutlass::arch