/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck_tile/ops/epilogue/default_2d_epilogue.hpp Source File
default_2d_epilogue.hpp
Go to the documentation of this file.
Definition: cluster_descriptor.hpp:13
typename impl::WarpGemmMfmaDispatcher< AType, BType, CType, MPerWave, NPerWave, KPerWave, TransposeC, SwizzleA >::Type WarpGemmMfmaDispatcher
Definition: warp_gemm_dispatcher.hpp:81
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:20
CK_TILE_DEVICE void buffer_store_fence(index_t cnt=0)
Definition: amd_buffer_addressing.hpp:867
CK_TILE_DEVICE void store_tile_raw(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: store_tile.hpp:46
CK_TILE_DEVICE void update_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: update_tile.hpp:22
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: store_tile.hpp:23
CK_TILE_DEVICE void update_tile_raw(tile_window_with_static_distribution< BottomTensorView_, WindowLengths_, TileDistribution_, NumCoord > &tile_window, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor, number< i_access >={}, bool_constant< oob_conditional_check >={}, bool_constant< pre_nop >={})
Definition: update_tile.hpp:68
Definition: default_2d_epilogue.hpp:50
remove_cvref_t< typename Problem::ODataType > ODataType
Definition: default_2d_epilogue.hpp:53
CK_TILE_DEVICE auto operator()(ODramWindowTmp &o_dram_window_tmp, const OAccTile &o_acc_tile, void *=nullptr)
Definition: default_2d_epilogue.hpp:66
remove_cvref_t< Problem_ > Problem
Definition: default_2d_epilogue.hpp:51
remove_cvref_t< typename Problem::AccDataType > AccDataType
Definition: default_2d_epilogue.hpp:52
static constexpr bool UseRawStore
Definition: default_2d_epilogue.hpp:56
static constexpr CK_TILE_HOST_DEVICE index_t GetSmemSize()
Definition: default_2d_epilogue.hpp:58
Definition: default_2d_epilogue.hpp:20
remove_cvref_t< ODataType_ > ODataType
Definition: default_2d_epilogue.hpp:22
static constexpr bool kPadM
Definition: default_2d_epilogue.hpp:23
remove_cvref_t< AccDataType_ > AccDataType
Definition: default_2d_epilogue.hpp:21
static constexpr bool kPadN
Definition: default_2d_epilogue.hpp:24
static constexpr bool UseRawStore
Definition: default_2d_epilogue.hpp:25
Definition: default_2d_epilogue.hpp:98
remove_cvref_t< typename Problem::AccDataType > AccDataType
Definition: default_2d_epilogue.hpp:100
static constexpr index_t kMPerXdl
Definition: default_2d_epilogue.hpp:103
WarpGemmMfmaDispatcher< ODataType, ODataType, AccDataType, kMPerXdl, kNPerXdl, kKPerXdl, isCTransposed > WG
Definition: default_2d_epilogue.hpp:114
static constexpr index_t kNPerXdl
Definition: default_2d_epilogue.hpp:104
static constexpr index_t kKPerXdl
Definition: default_2d_epilogue.hpp:105
static constexpr CK_TILE_HOST_DEVICE auto GetVectorSizeC()
Definition: default_2d_epilogue.hpp:118
static constexpr index_t isCTransposed
Definition: default_2d_epilogue.hpp:106
remove_cvref_t< typename Problem::CLayout > CLayout
Definition: default_2d_epilogue.hpp:102
remove_cvref_t< typename Problem::ODataType > ODataType
Definition: default_2d_epilogue.hpp:101
typename WG::CWarpDstr CWarpDstr
Definition: default_2d_epilogue.hpp:116
remove_cvref_t< Problem_ > Problem
Definition: default_2d_epilogue.hpp:99
Definition: default_2d_epilogue.hpp:40
static constexpr index_t isCTransposed
Definition: default_2d_epilogue.hpp:45
static constexpr index_t kKPerXdl
Definition: default_2d_epilogue.hpp:44
remove_cvref_t< CLayout_ > CLayout
Definition: default_2d_epilogue.hpp:41
static constexpr index_t kMPerXdl
Definition: default_2d_epilogue.hpp:42
static constexpr index_t kNPerXdl
Definition: default_2d_epilogue.hpp:43
Definition: integral_constant.hpp:13