#include <block_reduce2d.hpp>

constexpr CK_TILE_DEVICE BlockReduce2d()

template<typename XDistributedTensor_ , typename YDistributedTensor_ , typename ReduceFunc , typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
CK_TILE_DEVICE void operator()(const XDistributedTensor_ &x_tensor, YDistributedTensor_ &y_tensor, const ReduceFunc &reduce_func, ReducePacksPerXDim={})

template<typename XDistributedTensor_ , typename ReduceFunc , typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
CK_TILE_DEVICE auto operator()(const XDistributedTensor_ &x_tensor, const ComputeDataType &reduce_init, const ReduceFunc &reduce_func, ReducePacksPerXDim={})

◆ ComputeDataType
template<typename Problem_ , typename Policy_ = void>
◆ Problem
template<typename Problem_ , typename Policy_ = void>
◆ XDataType
template<typename Problem_ , typename Policy_ = void>
◆ BlockReduce2d()
template<typename Problem_ , typename Policy_ = void>
◆ MakeYBlockTile()
template<typename Problem_ , typename Policy_ = void>
template<typename XDistributedTensor_ >
◆ operator()() [1/2]
template<typename Problem_ , typename Policy_ = void>
template<typename XDistributedTensor_ , typename ReduceFunc , typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
◆ operator()() [2/2]
template<typename Problem_ , typename Policy_ = void>
template<typename XDistributedTensor_ , typename YDistributedTensor_ , typename ReduceFunc , typename ReducePacksPerXDim = uniform_sequence_gen_t<2, 1>>
CK_TILE_DEVICE void ck_tile::BlockReduce2d< Problem_, Policy_ >::operator()(
    const XDistributedTensor_ & x_tensor,
    YDistributedTensor_ & y_tensor,
    const ReduceFunc & reduce_func,
    ReducePacksPerXDim = {}
) [inline]
The documentation for this struct was generated from the following file:
- /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck_tile/ops/reduce/block/block_reduce2d.hpp