51 static inline char const* cutlassGetStatusString(
cutlass::Status status) {
56 return "Error Misaligned Operand";
58 return "Error Invalid Layout";
60 return "Error Invalid Problem";
62 return "Error Not Supported";
64 return "Error Workspace Null";
66 return "Error Internal";
70 return "Invalid status";
76 #if !defined(CUTLASS_ENABLE_TENSOR_CORE_MMA) 77 #define CUTLASS_ENABLE_TENSOR_CORE_MMA 0 82 #if defined(__NVCC__) || (defined(__clang__) && defined(__CUDA__)) 83 #define CUTLASS_HOST_DEVICE __forceinline__ __device__ __host__ 84 #define CUTLASS_DEVICE __forceinline__ __device__ 85 #elif defined(__CUDACC_RTC__) 86 #define CUTLASS_HOST_DEVICE __forceinline__ __device__ 87 #define CUTLASS_DEVICE __forceinline__ __device__ 89 #define CUTLASS_HOST_DEVICE inline 92 #define CUTLASS_ASSERT(x) assert(x) 97 #if defined(__CUDA_ARCH__) 98 #if defined(__CUDACC_RTC__) || (defined(__clang__) && defined(__CUDA__)) 99 #define CUTLASS_PRAGMA_UNROLL _Pragma("unroll") 100 #define CUTLASS_PRAGMA_NO_UNROLL _Pragma("unroll 1") 102 #define CUTLASS_PRAGMA_UNROLL #pragma unroll 103 #define CUTLASS_PRAGMA_NO_UNROLL #pragma unroll 1 106 #define CUTLASS_GEMM_LOOP CUTLASS_PRAGMA_NO_UNROLL 110 #define CUTLASS_PRAGMA_UNROLL 111 #define CUTLASS_PRAGMA_NO_UNROLL 112 #define CUTLASS_GEMM_LOOP 119 static const int NUM_THREADS_PER_WARP = 32;
120 static const int NUM_THREADS_PER_HALF_WARP = NUM_THREADS_PER_WARP / 2;
121 static const int NUM_THREADS_PER_QUAD = 4;
122 static const int NUM_THREADS_PER_QUAD_PAIR = NUM_THREADS_PER_QUAD * 2;
124 #if defined(__NVCC__) || (defined(__clang__) && defined(__CUDA__)) 130 asm (
"mov.u32 %0, %%laneid;" :
"=r"(ret));
Definition: aligned_buffer.h:35
Specified problem size is not supported by operator.
Operation is not supported on current device.
Operands fail alignment requirements.
An error within CUTLASS occurred.
The given workspace is null when it is required to be non-null.
Operation was successful.
Layout fails alignment requirement.
Status
Status code returned by CUTLASS operations.
Definition: cutlass.h:39