fused_moegemm_traits.hpp Source File
fused_moegemm_traits.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
FusedMoeGemmPipelineSequencerEnum
Definition fused_moegemm_traits.hpp:41
FusedMoeGemmWeightPermuteEnum
Definition fused_moegemm_traits.hpp:11
@ no_permute
Definition fused_moegemm_traits.hpp:14
@ b_nr_kr_kw_nw_kv
Definition fused_moegemm_traits.hpp:15
@ b_nr_kr_waveflatten
Definition fused_moegemm_traits.hpp:16
Definition fused_moegemm_traits.hpp:28
static constexpr FusedMoeGemmWeightPermuteEnum PermuteEnum
Definition fused_moegemm_traits.hpp:33
static constexpr bool PadHiddenSize
Definition fused_moegemm_traits.hpp:34
static constexpr bool PipeInterleave
Definition fused_moegemm_traits.hpp:36
static constexpr bool PadIntermediateSize
Definition fused_moegemm_traits.hpp:35
static constexpr bool UseSmoothQuant
Definition fused_moegemm_traits.hpp:31
static constexpr index_t OAtomic
Definition fused_moegemm_traits.hpp:32
static constexpr bool IsGateOnly
Definition fused_moegemm_traits.hpp:30