BlockNormReduceCrossWarpSync< Problem_, Policy_ > Struct Template Reference
Public Types |
Public Member Functions |
Static Public Member Functions |
Static Public Attributes |
List of all members
ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ > Struct Template Reference
#include <block_norm_reduce.hpp>
Public Types | |
| using | Problem = remove_cvref_t< Problem_ > |
| using | BlockShape = typename Problem::BlockShape |
| using | smem_dtype = std::conditional_t< kWelford, fp32x4_t, fp32x2_t > |
Public Member Functions | |
| template<typename MeanDistributedTensor_ , typename VarDistributedTensor_ > | |
| CK_TILE_DEVICE void | operator() (MeanDistributedTensor_ &mean_tensor, VarDistributedTensor_ &var_tensor, int &count, void *smem) |
Static Public Member Functions | |
| template<typename MeanDistributedTensor_ > | |
| static constexpr CK_TILE_DEVICE index_t | GetReduceWarps () |
| template<typename MeanDistributedTensor_ > | |
| static constexpr CK_TILE_HOST_DEVICE index_t | GetSmemSize () |
Static Public Attributes | |
| static constexpr bool | kFastFDiv = Problem::kFastFDiv |
| static constexpr bool | kWelford = Problem::kWelford |
Member Typedef Documentation
◆ BlockShape
template<typename Problem_ , typename Policy_ = void>
| using ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::BlockShape = typename Problem::BlockShape |
◆ Problem
template<typename Problem_ , typename Policy_ = void>
| using ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::Problem = remove_cvref_t<Problem_> |
◆ smem_dtype
template<typename Problem_ , typename Policy_ = void>
| using ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::smem_dtype = std::conditional_t<kWelford, fp32x4_t, fp32x2_t> |
Member Function Documentation
◆ GetReduceWarps()
template<typename Problem_ , typename Policy_ = void>
template<typename MeanDistributedTensor_ >
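| static constexpr CK_TILE_DEVICE index_t ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::GetReduceWarps () |
inline static constexpr |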
◆ GetSmemSize()
template<typename Problem_ , typename Policy_ = void>
template<typename MeanDistributedTensor_ >
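| static constexpr CK_TILE_HOST_DEVICE index_t ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::GetSmemSize () |
inline static constexpr |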
◆ operator()()
template<typename Problem_ , typename Policy_ = void>
template<typename MeanDistributedTensor_ , typename VarDistributedTensor_ >
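| CK_TILE_DEVICE void ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::operator() (MeanDistributedTensor_ &mean_tensor, VarDistributedTensor_ &var_tensor, int &count, void *smem) |
inline |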
Member Data Documentation
◆ kFastFDiv
template<typename Problem_ , typename Policy_ = void>
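| static constexpr bool ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::kFastFDiv = Problem::kFastFDiv |
static constexpr |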
◆ kWelford
template<typename Problem_ , typename Policy_ = void>
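| static constexpr bool ck_tile::BlockNormReduceCrossWarpSync< Problem_, Policy_ >::kWelford = Problem::kWelford |
static constexpr |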
The documentation for this struct was generated from the following file:
- /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck_tile/ops/norm_reduce/block/block_norm_reduce.hpp