MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias > Struct Template Reference
ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias > Struct Template Reference
#include <moe_flatmm_kernel.hpp>
Inheritance diagram for ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >:
Public Member Functions | |
| CK_TILE_HOST | MoeFlatmmHostArgs () noexcept=default |
| CK_TILE_HOST | MoeFlatmmHostArgs (const ck_tile::index_t *p_sorted_token_ids_, const void *p_sorted_expert_weights_, const ck_tile::index_t *p_sorted_expert_ids_, const ck_tile::index_t *p_max_token_id_, const void *a_ptr_, const void *b_ptr_, void *c_ptr_, ck_tile::index_t NumTokens_, ck_tile::index_t NumExperts_, ck_tile::index_t TopK_, ck_tile::index_t k_batch_, ck_tile::index_t M_, ck_tile::index_t N_, ck_tile::index_t K_, ck_tile::index_t stride_A_, ck_tile::index_t stride_B_, ck_tile::index_t stride_C_, ScaleM scale_m_={}, ScaleN scale_n_={}, ExpertBias exp_bias_={}) |
| CK_TILE_HOST | MoeFlatmmHostArgs (const ck_tile::index_t *p_sorted_token_ids_, const void *p_sorted_expert_weights_, const ck_tile::index_t *p_sorted_expert_ids_, const ck_tile::index_t *p_max_token_id_, const void *a_ptr_, const void *b_ptr_, void *c_ptr_, ck_tile::index_t NumTokens_, ck_tile::index_t NumExperts_, ck_tile::index_t TopK_, ck_tile::index_t k_batch_, ck_tile::index_t M_, ck_tile::index_t N_, ck_tile::index_t K_, ck_tile::index_t stride_A_, ck_tile::index_t stride_B_, ck_tile::index_t stride_C_, ck_tile::index_t n_padded_zeros_=0, ck_tile::index_t k_padded_zeros_=0, ScaleM scale_m_={}, ScaleN scale_n_={}, ExpertBias exp_bias_={}) |
| Public Member Functions inherited from ck_tile::ScaleFlatmmHostArgs< ScaleM, ScaleN, NumDTensor > | |
| CK_TILE_HOST | ScaleFlatmmHostArgs ()=default |
| CK_TILE_HOST | ScaleFlatmmHostArgs (const void *a_ptr_, const void *b_shuffle_ptr_, const std::array< const void *, NumDTensor > &ds_ptr_, void *c_ptr_, index_t k_batch_, index_t M_, index_t N_, index_t K_, index_t stride_A_, index_t stride_B_, const std::array< index_t, NumDTensor > &stride_Ds_, index_t stride_C_, ScaleM scale_m_=nullptr, ScaleN scale_n_=nullptr) |
| Public Member Functions inherited from ck_tile::BaseFlatmmHostArgs< NumDTensor > | |
| CK_TILE_HOST | BaseFlatmmHostArgs ()=default |
| CK_TILE_HOST | BaseFlatmmHostArgs (const void *a_ptr_, const void *b_ptr_, const std::array< const void *, NumDTensor > &ds_ptr_, void *e_ptr_, index_t k_batch_, index_t M_, index_t N_, index_t K_, index_t stride_A_, index_t stride_B_, const std::array< index_t, NumDTensor > &stride_Ds_, index_t stride_E_) |
Public Attributes | |
| ck_tile::index_t | NumTokens |
| ck_tile::index_t | NumExperts |
| ck_tile::index_t | TopK |
| const ck_tile::index_t * | p_sorted_token_ids |
| const ck_tile::index_t * | p_sorted_expert_ids |
| const ck_tile::index_t * | p_max_token_id |
| const void * | p_sorted_expert_weights |
| const ck_tile::index_t | n_padded_zeros |
| const ck_tile::index_t | k_padded_zeros |
| ExpertBias | exp_bias |
| Public Attributes inherited from ck_tile::ScaleFlatmmHostArgs< ScaleM, ScaleN, NumDTensor > | |
| ScaleM | scale_m = nullptr |
| ScaleN | scale_n = nullptr |
| Public Attributes inherited from ck_tile::BaseFlatmmHostArgs< NumDTensor > | |
| const void * | a_ptr |
| const void * | b_ptr |
| const std::array< const void *, NumDTensor > | ds_ptr |
| union { | |
| void * e_ptr | |
| void * c_ptr | |
| }; | |
| index_t | M |
| index_t | N |
| index_t | K |
| index_t | stride_A |
| index_t | stride_B |
| const std::array< index_t, NumDTensor > | stride_Ds |
| union { | |
| index_t stride_E | |
| index_t stride_C | |
| }; | |
| index_t | k_batch |
Constructor & Destructor Documentation
◆ MoeFlatmmHostArgs() [1/3]
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
|
default noexcept |
◆ MoeFlatmmHostArgs() [2/3]
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
|
inline |
◆ MoeFlatmmHostArgs() [3/3]
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
|
inline |
Member Data Documentation
◆ exp_bias
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| ExpertBias ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::exp_bias |
◆ k_padded_zeros
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| const ck_tile::index_t ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::k_padded_zeros |
◆ n_padded_zeros
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| const ck_tile::index_t ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::n_padded_zeros |
◆ NumExperts
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| ck_tile::index_t ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::NumExperts |
◆ NumTokens
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| ck_tile::index_t ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::NumTokens |
◆ p_max_token_id
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| const ck_tile::index_t* ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::p_max_token_id |
◆ p_sorted_expert_ids
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| const ck_tile::index_t* ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::p_sorted_expert_ids |
◆ p_sorted_expert_weights
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| const void* ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::p_sorted_expert_weights |
◆ p_sorted_token_ids
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| const ck_tile::index_t* ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::p_sorted_token_ids |
◆ TopK
template<class ScaleM = FlatmmScalePointer<-1>, class ScaleN = FlatmmScalePointer<-1>, class ExpertBias = FlatmmScalePointer<-1>>
| ck_tile::index_t ck_tile::MoeFlatmmHostArgs< ScaleM, ScaleN, ExpertBias >::TopK |
The documentation for this struct was generated from the following file: