#include <moe_flatmm_pipeline_agmem_bgmem_creg.hpp>
template<typename ADramBlockWindowTmp, typename AElementFunction, typename BFlatBlockWindowTmp, int IsGateUpMode>
CK_TILE_HOST_DEVICE auto operator() (const ADramBlockWindowTmp &a_dram_block_window_tmp, const AElementFunction &a_element_func, const BFlatBlockWindowTmp &b_flat_dram_block_window_tmp, number< IsGateUpMode >, index_t num_loop, void *p_smem_ping, void *p_smem_pong) const
template<typename ADramBlockWindowTmp, typename BFlatBlockWindowTmp, int IsGateUpMode>
CK_TILE_DEVICE auto operator() (const ADramBlockWindowTmp &a_dram_block_window_tmp, const BFlatBlockWindowTmp &b_flat_dram_block_window_tmp, number< IsGateUpMode > is_gate_up_mode, index_t num_loop, void *p_smem_ping, void *p_smem_pong) const
◆ ADataType
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ ALayout
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BDataType
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BLayout
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BlockFlatmm
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
Initial value:
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
◆ BlockGemmShape
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BlockTile
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BlockWarps
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ CDataType
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ CLayout
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ WarpTile
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ WG
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ GetADramTileDistribution()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ GetName()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ GetSmemSize()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ GetVectorSizeA()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ GetVectorSizeB()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ GetVectorSizeC()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ HotLoopScheduler()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ Last2ndHotLoopScheduler()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ LastHotLoopScheduler()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ operator()() [1/2]
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
template<typename ADramBlockWindowTmp, typename AElementFunction, typename BFlatBlockWindowTmp, int IsGateUpMode>
◆ operator()() [2/2]
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
template<typename ADramBlockWindowTmp, typename BFlatBlockWindowTmp, int IsGateUpMode>
◆ SchedulerPerM()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ TransposeC()
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ AK1
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ Aload_num_perK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ Aload_rep
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BK1
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ Bload_num_perK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ Bload_rep
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ BlockSize
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ config
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
Initial value:
= BlockFlatmm::BlockPolicy::template GetWarpGemmMWarpNWarp<Problem>()
◆ DoubleSmemBuffer
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ dsread_num_perK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ dsread_per_wg
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
Initial value:
remove_cvref_t< typename Problem::ADataType > ADataType
Definition flatmm_pipeline_agmem_bgmem_creg_v1.hpp:48
static constexpr index_t WaveSize
Definition flatmm_pipeline_agmem_bgmem_creg_v1.hpp:69
◆ DsReadPreload
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ dswrite_kIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ dswrite_mIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ dswrite_num_perK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ dswrite_rep
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ DsWritePreIssue
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ flatKPerWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ flatNPerWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ HalfMIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ HasHotLoop
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ I0
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ I1
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ I2
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ idxK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ idxM
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ idxN
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ KFlatPerBlockPerIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ KIterPerWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kKPerBlock
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kLdsAlignmentInBytes
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kMPerBlock
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kNPerBlock
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kPadK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kPadM
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ kPadN
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ KPerBlockPerIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ m_preload
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
Initial value:
static constexpr index_t MIterPerWarp
Definition flatmm_pipeline_agmem_bgmem_creg_v1.hpp:103
static constexpr index_t KIterPerWarp
Definition flatmm_pipeline_agmem_bgmem_creg_v1.hpp:105
static constexpr index_t DsReadPreload
Definition flatmm_pipeline_agmem_bgmem_creg_v1.hpp:66
◆ mfma_per_wg
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ mfma_perM_perK
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ MIterPerWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ MPerBlockPerIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ MWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ MXFP4PackedSize
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ NFlatPerBlockPerIter
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ NIterPerWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ NumWaveGroups
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ NWarp
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ TailNum
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ UsePersistentKernel
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
◆ WaveSize
template<typename Problem, typename PipelinePolicy = UniversalFlatmmPipelineAgBgCrPolicy>
The documentation for this struct was generated from the following file: