include/ck/tensor_operation/gpu/device/welford_helper.hpp Source File
welford_helper.hpp
Go to the documentation of this file.
Definition: ck.hpp:264
Definition: welford_helper.hpp:12
index_t count_in_last_tile_
Definition: welford_helper.hpp:39
__device__ index_t operator()(index_t thread_k_cluster_id) const
Definition: welford_helper.hpp:20
GetReduceCountPerThreadForBlockwiseWelford(index_t numBlockTileIteration, long_index_t reduce_length)
Definition: welford_helper.hpp:13
index_t numBlockTileIteration_
Definition: welford_helper.hpp:36
Definition: welford_helper.hpp:44
index_t blkGroupSize_
Definition: welford_helper.hpp:78
__device__ index_t operator()(index_t block_local_id, index_t thread_k_cluster_id) const
Definition: welford_helper.hpp:56
index_t numBlockTileIteration_
Definition: welford_helper.hpp:81
index_t numBlockTileIterationByLastBlock_
Definition: welford_helper.hpp:84
GetReduceCountPerThreadForMultiblockWelford(index_t blkGroupSize, index_t numBlockTileIteration, long_index_t reduce_length)
Definition: welford_helper.hpp:45
ck::tensor_operation::device::GetReduceCountPerThreadForMultiblockWelford::last_block_reduce_length_
index_t last_block_reduce_length_
Definition: welford_helper.hpp:83