/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-7.0.0/include/ck_tile/core/tensor/load_tile_transpose.hpp Source File
load_tile_transpose.hpp
Go to the documentation of this file.
179 static constexpr auto reversed_quad_output_hs_lengthss = tuple_reverse(quad_output_hs_lengthss);
constexpr CK_TILE_HOST_DEVICE auto make_embed_tile_distribution_encoding(OuterDstr, InnerDstr)
Definition: tile_distribution_encoding.hpp:539
constexpr bool is_sequence_suffix_v
Definition: load_tile_transpose.hpp:40
Definition: cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:21
constexpr CK_TILE_HOST_DEVICE auto generate_sequence_v2(F &&f, number< N >)
Definition: sequence.hpp:1036
constexpr CK_TILE_HOST_DEVICE index_t reduce_on_sequence(Seq, Reduce f, number< Init >)
Definition: sequence.hpp:973
CK_TILE_DEVICE auto load_tile_transpose(const tile_window_with_static_distribution< BottomTensorView_, WindowLengths_, TileDistribution_, NumCoord > &tile_window)
Transpose-loads a tile from a tensor and returns the resulting tensor with a new (transposed) tile distribution.
Definition: load_tile_transpose.hpp:319
constexpr CK_TILE_HOST_DEVICE auto to_sequence(tuple< number< Is >... >)
Definition: sequence.hpp:1046
constexpr CK_TILE_HOST_DEVICE auto tuple_reverse(const tuple< Ts... > &t)
Definition: tuple.hpp:547
constexpr CK_TILE_HOST_DEVICE auto InputTileDistributionEncoding()
Definition: load_tile_transpose.hpp:267
constexpr CK_TILE_HOST_DEVICE auto generate_tuple(F &&f, number< N >)
Definition: tuple.hpp:406
constexpr CK_TILE_HOST_DEVICE auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition: tile_distribution.hpp:498
typename conditional< predicate, X, Y >::type conditional_t
Definition: functional.hpp:115
Definition: load_tile_transpose.hpp:49
Definition: load_tile_transpose.hpp:66
Definition: load_tile_transpose.hpp:101
static constexpr bool dims_valid
Definition: load_tile_transpose.hpp:105
static constexpr index_t ndimp_outer
Definition: load_tile_transpose.hpp:118
static constexpr bool suffix_valid_dim1
Definition: load_tile_transpose.hpp:110
static constexpr auto input_ys_to_rhs_major
Definition: load_tile_transpose.hpp:131
static constexpr auto input_hs_lengthss
Definition: load_tile_transpose.hpp:102
static constexpr auto input_ps_to_rhss_major
Definition: load_tile_transpose.hpp:115
static constexpr bool suffix_valid_dim0
Definition: load_tile_transpose.hpp:107
static constexpr bool ys_mapping_valid
Definition: load_tile_transpose.hpp:134
static constexpr auto input_ys_to_rhs_minor
Definition: load_tile_transpose.hpp:132
static constexpr index_t ndimp_inner
Definition: load_tile_transpose.hpp:119
static constexpr bool ps_mapping_valid
Definition: load_tile_transpose.hpp:122
static constexpr auto input_ps_to_rhss_minor
Definition: load_tile_transpose.hpp:116
static constexpr bool value
Definition: load_tile_transpose.hpp:141
static constexpr auto quad_hs_lengthss
Definition: load_tile_transpose.hpp:103
Definition: load_tile_transpose.hpp:47
static constexpr auto group_func
Definition: load_tile_transpose.hpp:95
std::conditional_t< sizeof(DataType)==2, typename Quad16::OutputEncoding, typename Quad8::OutputEncoding > QuadOutputEncoding
Definition: load_tile_transpose.hpp:89
static constexpr auto transpose_dims
Definition: load_tile_transpose.hpp:92
std::conditional_t< sizeof(DataType)==2, typename Quad16::InputEncoding, typename Quad8::InputEncoding > QuadInputEncoding
Definition: load_tile_transpose.hpp:85
Definition: load_tile_transpose.hpp:161
static constexpr auto quad_ps_to_rhss_minor
Definition: load_tile_transpose.hpp:173
static constexpr auto dst_ys_to_rhs_major
Definition: load_tile_transpose.hpp:247
static constexpr auto input_ps_to_rhss_major
Definition: load_tile_transpose.hpp:167
static constexpr auto swap_one_and_two
Definition: load_tile_transpose.hpp:237
static constexpr auto quad_output_hs_lengthss
Definition: load_tile_transpose.hpp:165
static constexpr auto input_hs_lengthss
Definition: load_tile_transpose.hpp:163
static constexpr auto reversed_quad_output_hs_lengthss
Definition: load_tile_transpose.hpp:179
static constexpr auto input_ps_to_rhss_minor
Definition: load_tile_transpose.hpp:168
typename remove_cvref_t< TileDistribution_ >::DstrEncode InDstrEncode
Definition: load_tile_transpose.hpp:162
static constexpr auto modified_input_ys_to_rhs_major
Definition: load_tile_transpose.hpp:244
static constexpr auto quad_input_hs_lengthss
Definition: load_tile_transpose.hpp:164
static constexpr auto input_ys_to_rhs_minor
Definition: load_tile_transpose.hpp:170
static constexpr auto quad_ps_to_rhss_major
Definition: load_tile_transpose.hpp:172
static constexpr auto input_ys_to_rhs_major
Definition: load_tile_transpose.hpp:169
static constexpr auto dst_out_hs_lengthss
Definition: load_tile_transpose.hpp:192
static constexpr auto dst_ys_to_rhs_minor
Definition: load_tile_transpose.hpp:251
static constexpr auto major_last_index
Definition: load_tile_transpose.hpp:216
static constexpr auto dst_ps_to_rhss_minor
Definition: load_tile_transpose.hpp:218
static constexpr auto minor_last_index
Definition: load_tile_transpose.hpp:214
static constexpr auto dst_ps_to_rhss_major
Definition: load_tile_transpose.hpp:240
static constexpr auto full_out_hs_lengthss
Definition: load_tile_transpose.hpp:181
static constexpr auto modified_ps_to_rhss_major
Definition: load_tile_transpose.hpp:196
Definition: load_tile_transpose.hpp:147
static constexpr bool distr_encoding_valid
Definition: load_tile_transpose.hpp:152
typename Policy::template ValidationTraits< InDstrEncode > Validator
Definition: load_tile_transpose.hpp:150
typename remove_cvref_t< TileDistribution_ >::DstrEncode InDstrEncode
Definition: load_tile_transpose.hpp:148
Definition: sequence.hpp:278
typename std::conditional< kHasContent, type0, type1 >::type type
Definition: sequence.hpp:293
A fixed-size array container similar to std::array with additional utilities.
Definition: array.hpp:43
Definition: integral_constant.hpp:13
Definition: math.hpp:98
Definition: sequence.hpp:52
Definition: functional.hpp:43
Definition: tile_distribution_encoding.hpp:26
This class provides a tile (windowed) view of, and access to, device memory.
Definition: tile_window.hpp:46
Definition: tuple.hpp:192
Definition: load_tile_transpose.hpp:23
typename arithmetic_sequence_gen< start_pos, Sequence::size(), 1 >::type extract_indices
Definition: load_tile_transpose.hpp:27
static constexpr bool value
Definition: load_tile_transpose.hpp:29
static constexpr bool size_check
Definition: load_tile_transpose.hpp:24
static constexpr index_t start_pos
Definition: load_tile_transpose.hpp:26