#include <gridwise_tensor_rearrange.hpp>
 | 
| static __device__ void  | Run (const InputGridDesc &in_grid_desc, const InputDataType *__restrict__ p_in_global, const OutputGridDesc &out_grid_desc, OutputDataType *__restrict__ p_out_global, const index_t batch_count, const Block2ETileMap &block_2_tile_map, const ComputePtrOffsetOfStridedBatch &compute_ptr_offset_of_batch) | 
|   | 
| static constexpr __host__ bool  | CheckValidity (const InputGridDesc &in_grid_desc, const OutputGridDesc &out_grid_desc) | 
|   | 
◆ ThisThreadBlock
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch > 
      
        
          | using ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::ThisThreadBlock =  ThisThreadBlock<BlockSize> | 
        
      
 
 
◆ CheckValidity()
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch > 
  
  
      
        
          | static constexpr __host__ bool ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::CheckValidity  | 
          ( | 
          const InputGridDesc &  | 
          in_grid_desc,  | 
         
        
           | 
           | 
          const OutputGridDesc &  | 
          out_grid_desc  | 
         
        
           | 
          ) | 
           |  | 
         
       
   | 
  
inline static constexpr   | 
  
 
 
◆ Run()
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch > 
  
  
      
        
          | static __device__ void ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::Run  | 
          ( | 
          const InputGridDesc &  | 
          in_grid_desc,  | 
         
        
           | 
           | 
          const InputDataType *__restrict__  | 
          p_in_global,  | 
         
        
           | 
           | 
          const OutputGridDesc &  | 
          out_grid_desc,  | 
         
        
           | 
           | 
          OutputDataType *__restrict__  | 
          p_out_global,  | 
         
        
           | 
           | 
          const index_t  | 
          batch_count,  | 
         
        
           | 
           | 
          const Block2ETileMap &  | 
          block_2_tile_map,  | 
         
        
           | 
           | 
          const ComputePtrOffsetOfStridedBatch &  | 
          compute_ptr_offset_of_batch  | 
         
        
           | 
          ) | 
           |  | 
         
       
   | 
  
inline static   | 
  
 
 
◆ I0
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch > 
  
  
      
        
          | constexpr auto ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::I0 = Number<0>{} | 
         
       
   | 
  
static constexpr   | 
  
 
 
◆ I1
template<typename InputGridDesc , typename InputDataType , typename OutputGridDesc , typename OutputDataType , index_t BlockSize, index_t MPerBlock, index_t KPerBlock, typename ThreadClusterLengths , index_t ScalarPerVector, InMemoryDataOperationEnum DstInMemOp, typename Block2ETileMap , typename ComputePtrOffsetOfStridedBatch > 
  
  
      
        
          | constexpr auto ck::GridwiseTensorRearrange< InputGridDesc, InputDataType, OutputGridDesc, OutputDataType, BlockSize, MPerBlock, KPerBlock, ThreadClusterLengths, ScalarPerVector, DstInMemOp, Block2ETileMap, ComputePtrOffsetOfStridedBatch >::I1 = Number<1>{} | 
         
       
   | 
  
static constexpr   | 
  
 
 
The documentation for this struct was generated from the following file: