/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck/tensor_operation/gpu/block/thread_group_tensor_slice_transfer_v6r2.hpp Source File
thread_group_tensor_slice_transfer_v6r2.hpp
Go to the documentation of this file.
Definition: ck.hpp:264
__host__ constexpr __device__ auto make_multi_index(Xs &&... xs)
Definition: array_multi_index.hpp:15
typename remove_reference< T >::type remove_reference_t
Definition: type.hpp:292
__host__ constexpr __device__ auto make_zero_multi_index()
Definition: array_multi_index.hpp:21
__host__ constexpr __device__ auto make_cluster_descriptor(const Lengths &lengths, ArrangeOrder order=typename arithmetic_sequence_gen< 0, Lengths::Size(), 1 >::type{})
Definition: cluster_descriptor.hpp:13
Definition: array.hpp:14
ThreadGroupTensorSliceTransfer_v6r2
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:37
__device__ void MoveDstSliceWindow(const DstDesc &dst_desc, const Index &step)
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:125
static constexpr index_t nDim
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:38
constexpr __device__ ThreadGroupTensorSliceTransfer_v6r2(const Src0Desc &src0_desc, const Index &src0_block_slice_origin, const Src1Desc &src1_desc, const Index &src1_block_slice_origin, const DstDesc &dst_desc, const Index &dst_block_slice_origin, const ElementwiseOperation &element_op)
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:44
static constexpr auto thread_slice_lengths
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:40
__device__ void MoveSrc1SliceWindow(const Src1Desc &src1_desc, const Index &step)
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:116
__device__ void MoveSrc0SliceWindow(const Src0Desc &src0_desc, const Index &step)
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:107
__device__ void Run(const Src0Desc &src0_desc, const Src0Buffer &src0_buf, const Src1Desc &src1_desc, const Src1Buffer &src1_buf, const DstDesc &dst_desc, DstBuffer &dst_buf)
Definition: thread_group_tensor_slice_transfer_v6r2.hpp:93
__device__ void SetSrc0SliceOrigin(const Src0Desc &src0_desc, const Index &src0_slice_origin_idx)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:68
__device__ void SetSrc1SliceOrigin(const Src1Desc &src1_desc, const Index &src1_slice_origin_idx)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:74
__device__ void SetDstSliceOrigin(const DstDesc &dst_desc, const Index &dst_slice_origin_idx)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:80
__device__ void MoveSrc0SliceWindow(const Src0Desc &src0_desc, const Index &src0_slice_origin_step_idx)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:209
__device__ void Run(const Src0Desc &src0_desc, const Src0Buffer &src0_buf, const Src1Desc &src1_desc, const Src1Buffer &src1_buf, const DstDesc &dst_desc, DstBuffer &dst_buf)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:86
__device__ void MoveSrc1SliceWindow(const Src1Desc &src1_desc, const Index &src1_slice_origin_step_idx)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:224
__device__ void MoveDstSliceWindow(const DstDesc &dst_desc, const Index &dst_slice_origin_step_idx)
Definition: threadwise_tensor_slice_transfer_v6r2.hpp:239
Definition: type.hpp:177