ck::dpp_type< DppInstr::dpp8_f16_2x32x2 > Struct Reference

ck::dpp_type< DppInstr::dpp8_f16_2x32x2 > Struct Reference

Composable Kernel: ck::dpp_type< DppInstr::dpp8_f16_2x32x2 > Struct Reference
ck::dpp_type< DppInstr::dpp8_f16_2x32x2 > Struct Reference

#include <dpp_gemm.hpp>

Public Types

using BaseType = half_t

Public Member Functions

template<index_t MPerDpp, index_t NPerDpp, class ADataType, class BDataType, class CDataType>
__device__ void run (const ADataType &a, const BDataType &b, CDataType &reg_c) const

Static Public Attributes

static constexpr index_t wave_size = 32
static constexpr index_t lanegroup_size = 8
static constexpr index_t m_per_wave = 2
static constexpr index_t n_per_wave = 32
static constexpr index_t m_per_lanegroup = 2
static constexpr index_t n_per_lanegroup = 8
static constexpr index_t m_per_thread = 2
static constexpr index_t n_per_thread = 1
static constexpr index_t k_per_dpp = 2
static constexpr bool share_a = true

Member Typedef Documentation

◆ BaseType

Member Function Documentation

◆ run()

template<index_t MPerDpp, index_t NPerDpp, class ADataType, class BDataType, class CDataType>
__device__ void ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::run ( const ADataType & a,
const BDataType & b,
CDataType & reg_c ) const
inline

Member Data Documentation

◆ k_per_dpp

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::k_per_dpp = 2
static constexpr

◆ lanegroup_size

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::lanegroup_size = 8
static constexpr

◆ m_per_lanegroup

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::m_per_lanegroup = 2
static constexpr

◆ m_per_thread

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::m_per_thread = 2
static constexpr

◆ m_per_wave

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::m_per_wave = 2
static constexpr

◆ n_per_lanegroup

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::n_per_lanegroup = 8
static constexpr

◆ n_per_thread

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::n_per_thread = 1
static constexpr

◆ n_per_wave

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::n_per_wave = 32
static constexpr

◆ share_a

bool ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::share_a = true
static constexpr

◆ wave_size

index_t ck::dpp_type< DppInstr::dpp8_f16_2x32x2 >::wave_size = 32
static constexpr

The documentation for this struct was generated from the following file: