#include <gridwise_tensor_rearrange.hpp>
|
static __device__ void | Run (const InputGridDesc &in_grid_desc, const InputDataType *__restrict__ p_in_global, const OutputGridDesc &out_grid_desc, OutputDataType *__restrict__ p_out_global, const index_t batch_count, const Block2ETileMap &block_2_tile_map, const ComputePtrOffsetOfStridedBatch &compute_ptr_offset_of_batch) |
|
static constexpr __host__ bool | CheckValidity (const InputGridDesc &in_grid_desc, const OutputGridDesc &out_grid_desc) |
|
◆ ThisThreadBlock
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >
using ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::ThisThreadBlock = ThisThreadBlock<BlockSize> |
◆ CheckValidity()
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >
static constexpr __host__ bool ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::CheckValidity |
( |
const InputGridDesc & |
in_grid_desc, |
|
|
const OutputGridDesc & |
out_grid_desc |
|
) |
| |
|
inline static constexpr |
◆ Run()
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >
static __device__ void ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::Run |
( |
const InputGridDesc & |
in_grid_desc, |
|
|
const InputDataType *__restrict__ |
p_in_global, |
|
|
const OutputGridDesc & |
out_grid_desc, |
|
|
OutputDataType *__restrict__ |
p_out_global, |
|
|
const index_t |
batch_count, |
|
|
const Block2ETileMap & |
block_2_tile_map, |
|
|
const ComputePtrOffsetOfStridedBatch & |
compute_ptr_offset_of_batch |
|
) |
| |
|
inline static |
◆ I0
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >
constexpr auto ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::I0 = Number<0>{} |
|
static constexpr |
◆ I1
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch >
constexpr auto ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::I1 = Number<1>{} |
|
static constexpr |
The documentation for this struct was generated from the following file:
- /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck/tensor_operation/gpu/grid/gridwise_tensor_rearrange.hpp