BaseAQuantGemmPipelineAgBgCrMem< Problem > Struct Template Reference
ck_tile::BaseAQuantGemmPipelineAgBgCrMem< Problem > Struct Template Reference
#include <gemm_aquant_pipeline_ag_bg_cr_mem.hpp>
Inheritance diagram for ck_tile::BaseAQuantGemmPipelineAgBgCrMem< Problem >:
Static Public Member Functions | |
| static CK_TILE_HOST_DEVICE constexpr TailNumber | GetBlockLoopTailNum (index_t num_loop) |
| template<typename RunFunction> | |
| static CK_TILE_HOST_DEVICE auto | TailHandler (const RunFunction &run_func, bool has_hot_loop, TailNumber tail_number) |
| Static Public Member Functions inherited from ck_tile::BaseGemmPipelineAgBgCrMem< Problem > | |
| static CK_TILE_HOST_DEVICE constexpr auto | TransposeC () |
| static CK_TILE_HOST_DEVICE constexpr bool | BlockHasHotloop (index_t num_loop) |
| static CK_TILE_HOST_DEVICE constexpr TailNumber | GetBlockLoopTailNum (index_t num_loop) |
| template<typename RunFunction> | |
| static CK_TILE_HOST_DEVICE auto | TailHandler (const RunFunction &run_func, bool has_hot_loop, TailNumber tail_number) |
Additional Inherited Members | |
| Public Types inherited from ck_tile::BaseGemmPipelineAgBgCrMem< Problem > | |
| using | ADataType = remove_cvref_t<typename Problem::ADataType> |
| using | BDataType = remove_cvref_t<typename Problem::BDataType> |
| using | BlockGemmShape = remove_cvref_t<typename Problem::BlockGemmShape> |
| Static Public Attributes inherited from ck_tile::BaseGemmPipelineAgBgCrMem< Problem > | |
| static constexpr index_t | APackedSize |
| static constexpr index_t | BPackedSize |
| static constexpr index_t | BlockSize = Problem::kBlockSize |
| static constexpr index_t | MPerBlock = BlockGemmShape::kM |
| static constexpr index_t | NPerBlock = BlockGemmShape::kN |
| static constexpr index_t | KPerBlock = BlockGemmShape::kK |
| static constexpr index_t | MinMemInFlyBytes = 32768 |
| static constexpr index_t | WgpPerCU |
| static constexpr index_t | FullMemBandPrefetchStages |
| static constexpr index_t | PrefetchStages |
| static constexpr index_t | LocalPrefillStages = 1 |
| static constexpr index_t | GlobalBufferNum = PrefetchStages |
| static constexpr bool | UsePersistentKernel = Problem::Traits::UsePersistentKernel |
Member Function Documentation
◆ GetBlockLoopTailNum()
template<typename Problem>
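| static CK_TILE_HOST_DEVICE constexpr TailNumber ck_tile::BaseAQuantGemmPipelineAgBgCrMem< Problem >::GetBlockLoopTailNum (index_t num_loop) |
inline static constexpr |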
◆ TailHandler()
template<typename Problem>
template<typename RunFunction>
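| static CK_TILE_HOST_DEVICE auto ck_tile::BaseAQuantGemmPipelineAgBgCrMem< Problem >::TailHandler (const RunFunction &run_func, bool has_hot_loop, TailNumber tail_number) |
inline static |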
The documentation for this struct was generated from the following file: