#include <epilogue_workspace.h>
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
Parameters:

| Name | Description |
|---|---|
| params | Host-constructible params object |
| warp_idx | ID of warp within threadblock |
| lane_idx | ID of thread within warp |
template<typename Shape_ , int WarpCount, typename FragmentC_ >
Accumulator tile
Parameters:

| Name | Description |
|---|---|
| problem_size | Problem size of GEMM (in units of ElementC) |
| tb_tile_coord | Threadblock tile coordinate in GEMM (in units of threadblock tiles) |
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
template<typename Shape_ , int WarpCount, typename FragmentC_ >
The documentation for this class was generated from the following file: epilogue_workspace.h