reference_rmsnorm2d_fwd.hpp Source File
reference_rmsnorm2d_fwd.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
CK_TILE_HOST auto make_ParallelTensorFunctor(F f, Xs... xs)
Definition tile/host/host_tensor.hpp:329
CK_TILE_HOST_DEVICE constexpr bfloat16_t float_to_bf16(float f, constant< rounding >={})
Definition bfloat16.hpp:284
Rmsnorm2dSensitiveEnum::NO_SPECIFIC_MODEL
Definition rmsnorm2d_fwd_traits.hpp:42
void reference_rmsnorm2d_fwd(const HostTensor< XDataType > &x_m_n, const HostTensor< GammaDataType > &gamma_n, HostTensor< YDataType > &y_m_n, HostTensor< InvRmsDataType > &invRms_m, HostTensor< UnquantYDataType > &unquant_y_m_n, ComputeDataType epsilon, Epilogue epilogue_functor={}, const int use_model_sensitive_rmsnorm=static_cast< int >(Rmsnorm2dSensitiveEnum::NO_SPECIFIC_MODEL))
Definition reference_rmsnorm2d_fwd.hpp:41
CK_TILE_HOST_DEVICE constexpr Y type_convert(X x)
Definition tile/core/numeric/type_convert.hpp:29
const std::vector< std::size_t > & get_lengths() const
Definition tile/host/host_tensor.hpp:198
Definition tile/host/host_tensor.hpp:336
decltype(auto) get_lengths() const
Definition tile/host/host_tensor.hpp:390
decltype(auto) get_strides() const
Definition tile/host/host_tensor.hpp:394
Definition reference_rmsnorm2d_fwd.hpp:14
auto operator()(int m, const HostTensor< AccDataType > &acc)
Definition reference_rmsnorm2d_fwd.hpp:26
void operator()(int m, HostTensor< OutDataType > &o, const HostTensor< AccDataType > &acc)
Definition reference_rmsnorm2d_fwd.hpp:16