C/C++ API
The C/C++ API allows you to access the custom kernels defined in the libtransformer_engine.so library directly from C/C++, without using Python.
- activation.h
- cast.h
- gemm.h
- fused_attn.h
- enum NVTE_QKV_Layout
- enumerator NVTE_SB3HD
- enumerator NVTE_SBH3D
- enumerator NVTE_SBHD_SB2HD
- enumerator NVTE_SBHD_SBH2D
- enumerator NVTE_SBHD_SBHD_SBHD
- enumerator NVTE_BS3HD
- enumerator NVTE_BSH3D
- enumerator NVTE_BSHD_BS2HD
- enumerator NVTE_BSHD_BSH2D
- enumerator NVTE_BSHD_BSHD_BSHD
- enumerator NVTE_T3HD
- enumerator NVTE_TH3D
- enumerator NVTE_THD_T2HD
- enumerator NVTE_THD_TH2D
- enumerator NVTE_THD_THD_THD
- enum NVTE_QKV_Layout_Group
- enum NVTE_QKV_Format
- enum NVTE_Bias_Type
- enum NVTE_Mask_Type
- enum NVTE_Fused_Attn_Backend
- NVTE_QKV_Layout_Group nvte_get_qkv_layout_group
- NVTE_QKV_Format nvte_get_qkv_format
- NVTE_Fused_Attn_Backend nvte_get_fused_attn_backend
- void nvte_fused_attn_fwd_qkvpacked
- void nvte_fused_attn_bwd_qkvpacked
- void nvte_fused_attn_fwd_kvpacked
- void nvte_fused_attn_bwd_kvpacked
- void nvte_fused_attn_fwd
- void nvte_fused_attn_bwd
- enum NVTE_QKV_Layout
- layer_norm.h
- rmsnorm.h
- softmax.h
- transformer_engine.h
- typedef void *NVTETensor
- enum NVTEDType
- NVTETensor nvte_create_tensor
- void nvte_destroy_tensor
- NVTEDType nvte_tensor_type
- NVTEShape nvte_tensor_shape
- void *nvte_tensor_data
- float *nvte_tensor_amax
- float *nvte_tensor_scale
- float *nvte_tensor_scale_inv
- void nvte_tensor_pack_create
- void nvte_tensor_pack_destroy
- struct NVTEShape
- struct NVTETensorPack
- namespace transformer_engine
- enum class DType
- struct TensorWrapper
- inline TensorWrapper
- inline TensorWrapper
- inline TensorWrapper
- inline ~TensorWrapper
- TensorWrapper &operator=
- TensorWrapper
- inline TensorWrapper
- inline TensorWrapper &operator=
- inline NVTETensor data
- inline const NVTEShape shape
- inline DType dtype
- inline void *dptr
- inline float *amax
- inline float *scale
- inline float *scale_inv
- NVTETensor tensor_ = nullptr
- transpose.h