BaseGemmPipelineAgBgCrMem< Problem > Struct Template Reference
ck_tile::BaseGemmPipelineAgBgCrMem< Problem > Struct Template Reference
#include <gemm_pipeline_ag_bg_cr_mem.hpp>
Inheritance diagram for ck_tile::BaseGemmPipelineAgBgCrMem< Problem >:
Public Types
| using | ADataType = remove_cvref_t<typename Problem::ADataType> |
| using | BDataType = remove_cvref_t<typename Problem::BDataType> |
| using | BlockGemmShape = remove_cvref_t<typename Problem::BlockGemmShape> |
Static Public Member Functions
| static CK_TILE_HOST_DEVICE constexpr auto | TransposeC () |
| static CK_TILE_HOST_DEVICE constexpr bool | BlockHasHotloop (index_t num_loop) |
| static CK_TILE_HOST_DEVICE constexpr TailNumber | GetBlockLoopTailNum (index_t num_loop) |
| template<typename RunFunction> | |
| static CK_TILE_HOST_DEVICE auto | TailHandler (const RunFunction &run_func, bool has_hot_loop, TailNumber tail_number) |
Static Public Attributes
| static constexpr index_t | APackedSize |
| static constexpr index_t | BPackedSize |
| static constexpr index_t | BlockSize = Problem::kBlockSize |
| static constexpr index_t | MPerBlock = BlockGemmShape::kM |
| static constexpr index_t | NPerBlock = BlockGemmShape::kN |
| static constexpr index_t | KPerBlock = BlockGemmShape::kK |
| static constexpr index_t | MinMemInFlyBytes = 32768 |
| static constexpr index_t | WgpPerCU |
| static constexpr index_t | FullMemBandPrefetchStages |
| static constexpr index_t | PrefetchStages |
| static constexpr index_t | LocalPrefillStages = 1 |
| static constexpr index_t | GlobalBufferNum = PrefetchStages |
| static constexpr bool | UsePersistentKernel = Problem::Traits::UsePersistentKernel |
Member Typedef Documentation
◆ ADataType
template<typename Problem>
| using ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::ADataType = remove_cvref_t<typename Problem::ADataType> |
◆ BDataType
template<typename Problem>
| using ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::BDataType = remove_cvref_t<typename Problem::BDataType> |
◆ BlockGemmShape
template<typename Problem>
| using ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::BlockGemmShape = remove_cvref_t<typename Problem::BlockGemmShape> |
Member Function Documentation
◆ BlockHasHotloop()
template<typename Problem>
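| CK_TILE_HOST_DEVICE constexpr bool ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::BlockHasHotloop (index_t num_loop) |
inline static constexpr |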
◆ GetBlockLoopTailNum()
template<typename Problem>
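| CK_TILE_HOST_DEVICE constexpr TailNumber ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::GetBlockLoopTailNum (index_t num_loop) |
inline static constexpr |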
◆ TailHandler()
template<typename Problem>
template<typename RunFunction>
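| CK_TILE_HOST_DEVICE auto ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::TailHandler (const RunFunction &run_func, bool has_hot_loop, TailNumber tail_number) |
inline static |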
◆ TransposeC()
template<typename Problem>
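| CK_TILE_HOST_DEVICE constexpr auto ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::TransposeC () |
inline static constexpr |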
Member Data Documentation
◆ APackedSize
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::APackedSize |
static constexpr |
Initial value:
=
ck_tile::numeric_traits<remove_cvref_t<ADataType>>::PackedSize
Definition tile/core/numeric/numeric.hpp:81
◆ BlockSize
template<typename Problem>
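| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::BlockSize = Problem::kBlockSize |
static constexpr |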
◆ BPackedSize
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::BPackedSize |
static constexpr |
Initial value:
=
ck_tile::numeric_traits<remove_cvref_t<BDataType>>::PackedSize
◆ FullMemBandPrefetchStages
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::FullMemBandPrefetchStages |
static constexpr |
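Initial value:
= integer_divide_ceil(
MinMemInFlyBytes / WgpPerCU,
(MPerBlock * sizeof(ADataType) / APackedSize + NPerBlock * sizeof(BDataType) / BPackedSize) * KPerBlock)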
CK_TILE_HOST_DEVICE constexpr auto integer_divide_ceil(X x, Y y)
Definition tile/core/numeric/math.hpp:149
static constexpr index_t WgpPerCU
Definition blockwise_gemm_pipeline_xdlops_v2.hpp:146
static constexpr index_t MPerBlock
Definition gemm_pipeline_ag_bg_cr_mem.hpp:32
remove_cvref_t< typename Problem::BDataType > BDataType
Definition gemm_pipeline_ag_bg_cr_mem.hpp:21
static constexpr index_t BPackedSize
Definition gemm_pipeline_ag_bg_cr_mem.hpp:26
remove_cvref_t< typename Problem::ADataType > ADataType
Definition gemm_pipeline_ag_bg_cr_mem.hpp:20
static constexpr index_t MinMemInFlyBytes
Definition gemm_pipeline_ag_bg_cr_mem.hpp:37
static constexpr index_t KPerBlock
Definition gemm_pipeline_ag_bg_cr_mem.hpp:34
static constexpr index_t APackedSize
Definition gemm_pipeline_ag_bg_cr_mem.hpp:24
static constexpr index_t NPerBlock
Definition gemm_pipeline_ag_bg_cr_mem.hpp:33
◆ GlobalBufferNum
template<typename Problem>
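| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::GlobalBufferNum = PrefetchStages |
static constexpr |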
◆ KPerBlock
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::KPerBlock = BlockGemmShape::kK |
static constexpr |
◆ LocalPrefillStages
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::LocalPrefillStages = 1 |
static constexpr |
◆ MinMemInFlyBytes
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::MinMemInFlyBytes = 32768 |
static constexpr |
◆ MPerBlock
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::MPerBlock = BlockGemmShape::kM |
static constexpr |
◆ NPerBlock
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::NPerBlock = BlockGemmShape::kN |
static constexpr |
◆ PrefetchStages
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::PrefetchStages |
static constexpr |
Initial value:
= FullMemBandPrefetchStages >= 2
? FullMemBandPrefetchStages <= 8 ? FullMemBandPrefetchStages : 8
: 2
static constexpr index_t FullMemBandPrefetchStages
Definition blockwise_gemm_pipeline_xdlops_v2.hpp:148
◆ UsePersistentKernel
template<typename Problem>
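| constexpr bool ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::UsePersistentKernel = Problem::Traits::UsePersistentKernel |
static constexpr |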
◆ WgpPerCU
template<typename Problem>
| constexpr index_t ck_tile::BaseGemmPipelineAgBgCrMem< Problem >::WgpPerCU |
static constexpr |
Initial value:
=
static constexpr index_t BlockSize
Definition gemm_pipeline_ag_bg_cr_mem.hpp:31
The documentation for this struct was generated from the following file: