#include <cshuffle_epilogue.hpp>
◆ AccDataType
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::AccDataType = remove_cvref_t<AccDataType_> |
◆ AsDataType
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::AsDataType = remove_cvref_t<AsDataType_> |
◆ BsDataType
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::BsDataType = remove_cvref_t<BsDataType_> |
◆ CDElementwise
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::CDElementwise = remove_cvref_t<CDElementwise_> |
◆ DsDataType
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::DsDataType = remove_cvref_t<DsDataType_> |
◆ DsLayout
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::DsLayout = remove_cvref_t<DsLayout_> |
◆ ELayout
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::ELayout = remove_cvref_t<ELayout_> |
◆ ODataType
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| using ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::ODataType = remove_cvref_t<ODataType_> |
◆ BlockedXDLN_PerWarp
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::BlockedXDLN_PerWarp = BlockedXDLN_PerWarp_ |
|
static constexpr |
◆ FixedVectorSize
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| bool ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::FixedVectorSize = FixedVectorSize_ |
|
static constexpr |
◆ isCTransposed
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::isCTransposed = isCTransposed_ |
|
static constexpr |
◆ kBlockSize
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::kBlockSize = MWave_ * NWave_ * get_warp_size() |
|
static constexpr |
◆ kMPerBlock
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::kMPerBlock = kM_ |
|
static constexpr |
◆ kNPerBlock
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::kNPerBlock = kN_ |
|
static constexpr |
◆ kNumWaveGroups
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::kNumWaveGroups = kNumWaveGroups_ |
|
static constexpr |
◆ KPerXdl
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::KPerXdl = KPerXdl_ |
|
static constexpr |
◆ MemoryOperation
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| memory_operation_enum ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::MemoryOperation = MemoryOperation_ |
|
static constexpr |
◆ MPerXdl
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::MPerXdl = MPerXdl_ |
|
static constexpr |
◆ MWave
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::MWave = MWave_ |
|
static constexpr |
◆ NPerXdl
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::NPerXdl = NPerXdl_ |
|
static constexpr |
◆ NumDTensor
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::NumDTensor = DsDataType::size() |
|
static constexpr |
◆ NWave
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::NWave = NWave_ |
|
static constexpr |
◆ TiledMMAPermuteN
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| bool ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::TiledMMAPermuteN = TiledMMAPermuteN_ |
|
static constexpr |
◆ VectorSizeC
template<typename AsDataType_, typename BsDataType_, typename DsDataType_, typename AccDataType_, typename ODataType_, typename DsLayout_, typename ELayout_, typename CDElementwise_,
index_t kM_,
index_t kN_,
index_t MWave_,
index_t NWave_,
index_t MPerXdl_,
index_t NPerXdl_,
index_t KPerXdl_, bool isCTransposed_,
memory_operation_enum MemoryOperation_,
index_t kNumWaveGroups_ = 1, bool FixedVectorSize_ = false,
index_t VectorSizeC_ = 1, bool TiledMMAPermuteN_ = false,
index_t BlockedXDLN_PerWarp_ = 1>
| index_t ck_tile::CShuffleEpilogueProblem< AsDataType_, BsDataType_, DsDataType_, AccDataType_, ODataType_, DsLayout_, ELayout_, CDElementwise_, kM_, kN_, MWave_, NWave_, MPerXdl_, NPerXdl_, KPerXdl_, isCTransposed_, MemoryOperation_, kNumWaveGroups_, FixedVectorSize_, VectorSizeC_, TiledMMAPermuteN_, BlockedXDLN_PerWarp_ >::VectorSizeC = VectorSizeC_ |
|
static constexpr |
The documentation for this struct was generated from the following file: