generic_memory_space_atomic.hpp Source File
tile/core/arch/generic_memory_space_atomic.hpp
Go to the documentation of this file.
96 // intentionally have only declaration but no definition to cause compilation failure when trying to
97 // instantiate this template. The purpose is to make the implementation of atomic_add explicit for
Definition tile/core/algorithm/cluster_descriptor.hpp:13
CK_TILE_DEVICE void atomic_add< bf16x2_t >(bf16x2_t *p_dst, const bf16x2_t &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:103
CK_TILE_DEVICE void atomic_add(X *p_dst, const X &x)
CK_TILE_DEVICE void atomic_add_g(T *p_dst, const thread_buffer< T, N > &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:358
CK_TILE_DEVICE void atomic_add< fp8x8_t >(fp8x8_t *p_dst, fp8x8_t const &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:243
CK_TILE_HOST_DEVICE fp8x8_t add_fp8x8_t(const fp8x8_t &a, const fp8x8_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:57
CK_TILE_HOST_DEVICE T add(const T &a, const T &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:16
CK_TILE_DEVICE void atomic_add< bf16x4_t >(bf16x4_t *p_dst, bf16x4_t const &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:134
CK_TILE_HOST_DEVICE bf8x8_t add_bf8x8_t(const bf8x8_t &a, const bf8x8_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:81
CK_TILE_HOST_DEVICE fp8x4_t add_fp8x4_t(const fp8x4_t &a, const fp8x4_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:47
CK_TILE_DEVICE void atomic_add< fp8x4_t >(fp8x4_t *p_dst, const fp8x4_t &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:176
CK_TILE_HOST_DEVICE PY c_style_pointer_cast(PX p_x)
Definition type_traits.hpp:104
CK_TILE_HOST_DEVICE bf16x2_t add_bf16x2_t(const bf16x2_t &a, const bf16x2_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:21
CK_TILE_DEVICE void atomic_add< fp16x2_t >(fp16x2_t *p_dst, fp16x2_t const &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:323
CK_TILE_HOST_DEVICE fp16x2_t add_f16x2_t(const fp16x2_t &a, const fp16x2_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:39
CK_TILE_HOST_DEVICE constexpr Y type_convert(X x)
Definition tile/core/numeric/type_convert.hpp:29
CK_TILE_DEVICE void atomic_max_g(T *p_dst, const thread_buffer< T, N > &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:479
CK_TILE_HOST_DEVICE bf16x4_t add_bf16x4_t(const bf16x4_t &a, const bf16x4_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:29
CK_TILE_DEVICE void atomic_add< bf8x4_t >(bf8x4_t *p_dst, const bf8x4_t &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:208
CK_TILE_HOST_DEVICE bf8x4_t add_bf8x4_t(const bf8x4_t &a, const bf8x4_t &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:71
CK_TILE_DEVICE void atomic_add< bf8x8_t >(bf8x8_t *p_dst, bf8x8_t const &x)
Definition tile/core/arch/generic_memory_space_atomic.hpp:284
Definition tile/core/utility/functional.hpp:43
Definition tile/core/utility/debug.hpp:67