GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch > Struct Template Reference

GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch > Struct Template Reference

Composable Kernel: ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch > Struct Template Reference

#include <gridwise_tensor_rearrange.hpp>

Public Types
using	ThisThreadBlock = ThisThreadBlock< BlockSize >

Static Public Member Functions
static __device__ void	Run (const InputGridDesc &in_grid_desc, const InputDataType *__restrict__ p_in_global, const OutputGridDesc &out_grid_desc, OutputDataType *__restrict__ p_out_global, const index_t batch_count, const Block2ETileMap &block_2_tile_map, const ComputePtrOffsetOfStridedBatch &compute_ptr_offset_of_batch)

static constexpr __host__ bool	CheckValidity (const InputGridDesc &in_grid_desc, const OutputGridDesc &out_grid_desc)

Static Public Attributes
static constexpr auto	I0 = Number<0>{}

static constexpr auto	I1 = Number<1>{}

Member Typedef Documentation

◆ ThisThreadBlock

template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >

using ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::ThisThreadBlock = ThisThreadBlock<BlockSize>

Member Function Documentation

◆ CheckValidity()

template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >

static constexpr __host__ bool ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::CheckValidity	(	const InputGridDesc &	in_grid_desc,
		const OutputGridDesc &	out_grid_desc
	)

inline static constexpr

◆ Run()

template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >

static __device__ void ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::Run	(	const InputGridDesc &	in_grid_desc,
		const InputDataType *__restrict__	p_in_global,
		const OutputGridDesc &	out_grid_desc,
		OutputDataType *__restrict__	p_out_global,
		const index_t	batch_count,
		const Block2ETileMap &	block_2_tile_map,
		const ComputePtrOffsetOfStridedBatch &	compute_ptr_offset_of_batch
	)

inline static

Member Data Documentation

◆ I0

template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >

constexpr auto ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::I0 = Number<0>{}

static constexpr

◆ I1

template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >

constexpr auto ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::I1 = Number<1>{}

static constexpr

The documentation for this struct was generated from the following file:

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck/tensor_operation/gpu/grid/gridwise_tensor_rearrange.hpp

GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch > Struct Template Reference

GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch > Struct Template Reference

Public Types

Static Public Member Functions

Static Public Attributes

Member Typedef Documentation

◆ ThisThreadBlock

Member Function Documentation

◆ CheckValidity()

◆ Run()

Member Data Documentation

◆ I0

◆ I1

GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch > Struct Template Reference