/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck_tile/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_two_pass.hpp Source File
layernorm2d_fwd_pipeline_two_pass.hpp
Go to the documentation of this file.
Definition: cluster_descriptor.hpp:13
constexpr CK_TILE_HOST_DEVICE auto integer_divide_ceil(X x, Y y)
Definition: math.hpp:149
CK_TILE_DEVICE auto tile_elementwise_in(const InElementFunc &in_element_func, const InTensor &... in_dstr_tensors)
Definition: tile_elementwise.hpp:40
@ DYNAMIC_QUANT
@ ADD_BIAS
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:20
constexpr CK_TILE_DEVICE void block_tile_welford_post_scale_var(VarDistributedTensor_ &var_tensor, int count, bool_constant< FastFdiv_ >={})
Definition: block_norm_reduce.hpp:393
CK_TILE_DEVICE auto load_tile(const tile_window_with_static_distribution< BottomTensorView_, WindowLengths_, TileDistribution_, NumCoord > &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition: load_tile.hpp:27
@ PRE_ADD_STORE
constexpr CK_TILE_DEVICE auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition: null_tile_window.hpp:72
CK_TILE_DEVICE void move_tile_window(null_tile_window< WindowLengths > &, const typename null_tile_window< WindowLengths >::BottomTensorIndex &)
Definition: null_tile_window.hpp:92
constexpr CK_TILE_HOST_DEVICE auto make_tuple(Xs &&... xs)
Definition: tuple.hpp:337
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition: store_tile.hpp:23
constexpr CK_TILE_HOST_DEVICE void sweep_tile(const F &f, UnpacksPerXDim={})
Definition: sweep_tile.hpp:231
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:15
static constexpr auto kXbias
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:41
static constexpr bool kHasBeta
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:32
static constexpr bool kWelford
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:40
static constexpr CK_TILE_HOST_DEVICE index_t GetSmemSize()
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:52
ck_tile::remove_cvref_t< typename Problem::XBiasDataType > XBiasDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:20
XDataType XResidualDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:28
static constexpr bool kSaveInvStd
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:34
CK_TILE_DEVICE auto operator()(const XWindow &x_window_, const XResidualWindow &x_residual_window_, const XBiasWindow &x_bias_window_, const GammaWindow &gamma_window_, const BetaWindow &beta_window_, YWindow &y_window, const YResidualWindow &y_residual_window_, MeanWindow &mean_window, InvStdWindow &inv_std_window, const SmoothScaleWindow &, YScaleWindow &, ComputeDataType epsilon, ck_tile::index_t row_size, void *smem, Epilogue) const
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:69
ck_tile::remove_cvref_t< typename Problem::BetaDataType > BetaDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:22
static constexpr auto kFusedQuant
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:43
static constexpr bool kHasGamma
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:31
ck_tile::remove_cvref_t< typename Problem::GammaDataType > GammaDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:21
ck_tile::remove_cvref_t< Problem_ > Problem
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:16
ck_tile::remove_cvref_t< typename Problem::ComputeDataType > ComputeDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:23
static constexpr bool kFastFDiv
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:39
XDataType YResidualDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:29
ck_tile::remove_cvref_t< typename Problem::InvStdDataType > InvStdDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:26
static constexpr bool kSaveMean
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:33
static constexpr bool kPadM
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:37
ck_tile::remove_cvref_t< typename Problem::YDataType > YDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:24
static constexpr bool kPadN
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:38
static constexpr auto kFusedAdd
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:42
ck_tile::remove_cvref_t< Policy_ > Policy
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:17
ck_tile::remove_cvref_t< typename Problem::XDataType > XDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:19
static constexpr bool kNeedCrossWarpSync
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:36
static constexpr const char * name
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:45
ck_tile::remove_cvref_t< typename Problem::MeanDataType > MeanDataType
Definition: layernorm2d_fwd_pipeline_two_pass.hpp:25
Definition: integral_constant.hpp:13