/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-7.0.0/include/ck_tile/ops/fmha/pipeline/block_fmha_pipeline_problem.hpp Source File
block_fmha_pipeline_problem.hpp
Go to the documentation of this file.
Definition: cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:21
typename conditional< predicate, X, Y >::type conditional_t
Definition: functional.hpp:115
Definition: block_fmha_pipeline_problem.hpp:235
remove_cvref_t< QDataType_ > QDataType
Definition: block_fmha_pipeline_problem.hpp:236
static constexpr bool kPadSeqLenK
Definition: block_fmha_pipeline_problem.hpp:257
static constexpr bool kPadHeadDimQ
Definition: block_fmha_pipeline_problem.hpp:258
std::conditional_t< kIsVLayoutRowMajor_, ck_tile::tensor_layout::gemm::RowMajor, ck_tile::tensor_layout::gemm::ColumnMajor > VLayout
Definition: block_fmha_pipeline_problem.hpp:250
static constexpr auto RotaryEnum
Definition: block_fmha_pipeline_problem.hpp:252
static constexpr index_t kK0
Definition: block_fmha_pipeline_problem.hpp:245
static constexpr bool kPadSeqLenQ
Definition: block_fmha_pipeline_problem.hpp:256
remove_cvref_t< Traits_ > Traits
Definition: block_fmha_pipeline_problem.hpp:239
static constexpr bool kIsPagedKV
Definition: block_fmha_pipeline_problem.hpp:253
remove_cvref_t< VDataType_ > VDataType
Definition: block_fmha_pipeline_problem.hpp:238
static constexpr index_t kM0
Definition: block_fmha_pipeline_problem.hpp:243
static constexpr index_t kN1
Definition: block_fmha_pipeline_problem.hpp:246
static constexpr index_t kBlockPerCu
Definition: block_fmha_pipeline_problem.hpp:260
static constexpr index_t kBlockSize
Definition: block_fmha_pipeline_problem.hpp:241
static constexpr bool kPadHeadDimV
Definition: block_fmha_pipeline_problem.hpp:259
remove_cvref_t< KDataType_ > KDataType
Definition: block_fmha_pipeline_problem.hpp:237
static constexpr index_t kN0
Definition: block_fmha_pipeline_problem.hpp:244
Definition: block_fmha_pipeline_problem.hpp:80
remove_cvref_t< SMPLComputeDataType_ > SMPLComputeDataType
Definition: block_fmha_pipeline_problem.hpp:85
static constexpr bool kPadHeadDimQ
Definition: block_fmha_pipeline_problem.hpp:105
static constexpr bool kDoFp8StaticQuant
Definition: block_fmha_pipeline_problem.hpp:111
remove_cvref_t< Traits_ > Traits
Definition: block_fmha_pipeline_problem.hpp:94
static constexpr index_t kBlockPerCu
Definition: block_fmha_pipeline_problem.hpp:113
remove_cvref_t< BlockFmhaShape_ > BlockFmhaShape
Definition: block_fmha_pipeline_problem.hpp:91
static constexpr bool kPadHeadDimV
Definition: block_fmha_pipeline_problem.hpp:106
remove_cvref_t< VDataType_ > VDataType
Definition: block_fmha_pipeline_problem.hpp:83
remove_cvref_t< AttentionVariant_ > AttentionVariant
Definition: block_fmha_pipeline_problem.hpp:92
remove_cvref_t< FmhaMask_ > FmhaMask
Definition: block_fmha_pipeline_problem.hpp:93
remove_cvref_t< PDataType_ > PDataType
Definition: block_fmha_pipeline_problem.hpp:88
remove_cvref_t< SaccDataType_ > SaccDataType
Definition: block_fmha_pipeline_problem.hpp:84
remove_cvref_t< KDataType_ > KDataType
Definition: block_fmha_pipeline_problem.hpp:82
static constexpr auto BiasEnum
Definition: block_fmha_pipeline_problem.hpp:109
remove_cvref_t< QDataType_ > QDataType
Definition: block_fmha_pipeline_problem.hpp:81
remove_cvref_t< BiasDataType_ > BiasDataType
Definition: block_fmha_pipeline_problem.hpp:86
remove_cvref_t< OaccDataType_ > OaccDataType
Definition: block_fmha_pipeline_problem.hpp:89
static constexpr bool kHasLogitsSoftCap
Definition: block_fmha_pipeline_problem.hpp:107
static constexpr bool kPadSeqLenQ
Definition: block_fmha_pipeline_problem.hpp:103
static constexpr index_t kBlockSize
Definition: block_fmha_pipeline_problem.hpp:98
static constexpr bool kPadSeqLenK
Definition: block_fmha_pipeline_problem.hpp:104
remove_cvref_t< ODataType_ > ODataType
Definition: block_fmha_pipeline_problem.hpp:90
static constexpr index_t kNumGemm0Warps
Definition: block_fmha_pipeline_problem.hpp:96
static constexpr bool kIsGroupMode
Definition: block_fmha_pipeline_problem.hpp:100
remove_cvref_t< LSEDataType_ > LSEDataType
Definition: block_fmha_pipeline_problem.hpp:87
static constexpr bool kIsPagedKV
Definition: block_fmha_pipeline_problem.hpp:112
static constexpr bool kStoreLSE
Definition: block_fmha_pipeline_problem.hpp:110
static constexpr bool kSkipMinSeqlenQ
Definition: block_fmha_pipeline_problem.hpp:108
static constexpr index_t kNumGemm1Warps
Definition: block_fmha_pipeline_problem.hpp:97
Definition: block_fmha_pipeline_problem.hpp:132
static constexpr bool kHasUnevenSplits
Definition: block_fmha_pipeline_problem.hpp:164
remove_cvref_t< VDataType_ > VDataType
Definition: block_fmha_pipeline_problem.hpp:135
static constexpr bool kHasLogitsSoftCap
Definition: block_fmha_pipeline_problem.hpp:159
remove_cvref_t< FmhaMask_ > FmhaMask
Definition: block_fmha_pipeline_problem.hpp:145
static constexpr bool kPadHeadDimQ
Definition: block_fmha_pipeline_problem.hpp:157
static constexpr bool kDoFp8StaticQuant
Definition: block_fmha_pipeline_problem.hpp:162
static constexpr index_t kNumGemm0Warps
Definition: block_fmha_pipeline_problem.hpp:148
remove_cvref_t< QDataType_ > QDataType
Definition: block_fmha_pipeline_problem.hpp:133
remove_cvref_t< OaccDataType_ > OaccDataType
Definition: block_fmha_pipeline_problem.hpp:141
remove_cvref_t< LSEDataType_ > LSEDataType
Definition: block_fmha_pipeline_problem.hpp:139
static constexpr bool kIsGroupMode
Definition: block_fmha_pipeline_problem.hpp:152
static constexpr bool kMergeNumHeadGroupsSeqLenQ
Definition: block_fmha_pipeline_problem.hpp:165
static constexpr index_t kNumGemm1Warps
Definition: block_fmha_pipeline_problem.hpp:149
remove_cvref_t< SaccDataType_ > SaccDataType
Definition: block_fmha_pipeline_problem.hpp:136
static constexpr bool kIsPagedKV
Definition: block_fmha_pipeline_problem.hpp:163
remove_cvref_t< SMPLComputeDataType_ > SMPLComputeDataType
Definition: block_fmha_pipeline_problem.hpp:137
remove_cvref_t< BlockFmhaShape_ > BlockFmhaShape
Definition: block_fmha_pipeline_problem.hpp:143
remove_cvref_t< KDataType_ > KDataType
Definition: block_fmha_pipeline_problem.hpp:134
static constexpr bool kPadSeqLenQ
Definition: block_fmha_pipeline_problem.hpp:155
static constexpr index_t kBlockSize
Definition: block_fmha_pipeline_problem.hpp:150
static constexpr index_t kBlockPerCu
Definition: block_fmha_pipeline_problem.hpp:166
remove_cvref_t< PDataType_ > PDataType
Definition: block_fmha_pipeline_problem.hpp:140
remove_cvref_t< ODataType_ > ODataType
Definition: block_fmha_pipeline_problem.hpp:142
static constexpr auto BiasEnum
Definition: block_fmha_pipeline_problem.hpp:160
remove_cvref_t< AttentionVariant_ > AttentionVariant
Definition: block_fmha_pipeline_problem.hpp:144
static constexpr bool kPadSeqLenK
Definition: block_fmha_pipeline_problem.hpp:156
static constexpr bool kStoreLSE
Definition: block_fmha_pipeline_problem.hpp:161
remove_cvref_t< BiasDataType_ > BiasDataType
Definition: block_fmha_pipeline_problem.hpp:138
static constexpr bool kPadHeadDimV
Definition: block_fmha_pipeline_problem.hpp:158
remove_cvref_t< Traits_ > Traits
Definition: block_fmha_pipeline_problem.hpp:146
Definition: block_fmha_pipeline_problem.hpp:27
remove_cvref_t< AttentionVariant_ > AttentionVariant
Definition: block_fmha_pipeline_problem.hpp:40
remove_cvref_t< KDataType_ > KDataType
Definition: block_fmha_pipeline_problem.hpp:29
remove_cvref_t< SaccDataType_ > SaccDataType
Definition: block_fmha_pipeline_problem.hpp:31
static constexpr bool kSkipMinSeqlenQ
Definition: block_fmha_pipeline_problem.hpp:56
remove_cvref_t< SMPLComputeDataType_ > SMPLComputeDataType
Definition: block_fmha_pipeline_problem.hpp:32
remove_cvref_t< FmhaMask_ > FmhaMask
Definition: block_fmha_pipeline_problem.hpp:41
remove_cvref_t< BiasDataType_ > BiasDataType
Definition: block_fmha_pipeline_problem.hpp:33
static constexpr bool kHasDropout
Definition: block_fmha_pipeline_problem.hpp:59
remove_cvref_t< QDataType_ > QDataType
Definition: block_fmha_pipeline_problem.hpp:28
remove_cvref_t< ODataType_ > ODataType
Definition: block_fmha_pipeline_problem.hpp:38
static constexpr index_t kBlockPerCu
Definition: block_fmha_pipeline_problem.hpp:61
static constexpr bool kStoreLSE
Definition: block_fmha_pipeline_problem.hpp:58
remove_cvref_t< BlockFmhaShape_ > BlockFmhaShape
Definition: block_fmha_pipeline_problem.hpp:39
static constexpr auto BiasEnum
Definition: block_fmha_pipeline_problem.hpp:57
static constexpr bool kPadHeadDimQ
Definition: block_fmha_pipeline_problem.hpp:53
remove_cvref_t< LSEDataType_ > LSEDataType
Definition: block_fmha_pipeline_problem.hpp:35
remove_cvref_t< Traits_ > Traits
Definition: block_fmha_pipeline_problem.hpp:42
static constexpr bool kPadHeadDimV
Definition: block_fmha_pipeline_problem.hpp:54
remove_cvref_t< OaccDataType_ > OaccDataType
Definition: block_fmha_pipeline_problem.hpp:37
static constexpr bool kIsGroupMode
Definition: block_fmha_pipeline_problem.hpp:48
static constexpr bool kPadSeqLenK
Definition: block_fmha_pipeline_problem.hpp:52
remove_cvref_t< PDataType_ > PDataType
Definition: block_fmha_pipeline_problem.hpp:36
static constexpr index_t kNumGemm0Warps
Definition: block_fmha_pipeline_problem.hpp:44
static constexpr bool kHasLogitsSoftCap
Definition: block_fmha_pipeline_problem.hpp:55
remove_cvref_t< RandValOutputDataType_ > RandValOutputDataType
Definition: block_fmha_pipeline_problem.hpp:34
static constexpr index_t kNumGemm1Warps
Definition: block_fmha_pipeline_problem.hpp:45
remove_cvref_t< VDataType_ > VDataType
Definition: block_fmha_pipeline_problem.hpp:30
static constexpr bool kDoFp8StaticQuant
Definition: block_fmha_pipeline_problem.hpp:60
static constexpr index_t kBlockSize
Definition: block_fmha_pipeline_problem.hpp:46
static constexpr bool kPadSeqLenQ
Definition: block_fmha_pipeline_problem.hpp:51
Definition: block_fmha_pipeline_problem.hpp:189
remove_cvref_t< ODataType_ > ODataType
Definition: block_fmha_pipeline_problem.hpp:194
static constexpr index_t kNumWarps
Definition: block_fmha_pipeline_problem.hpp:216
remove_cvref_t< Traits_ > Traits
Definition: block_fmha_pipeline_problem.hpp:195
static constexpr index_t kHeadDimV
Definition: block_fmha_pipeline_problem.hpp:199
static constexpr index_t kBlockSize
Definition: block_fmha_pipeline_problem.hpp:217
static constexpr index_t kM0
Definition: block_fmha_pipeline_problem.hpp:177
static constexpr index_t kBlockPerCu
Definition: block_fmha_pipeline_problem.hpp:212
static constexpr bool kIsGroupMode
Definition: block_fmha_pipeline_problem.hpp:200
static constexpr index_t kMaxSplits
Definition: block_fmha_pipeline_problem.hpp:213
static constexpr bool kPadHeadDimV
Definition: block_fmha_pipeline_problem.hpp:209
static constexpr bool kStoreLSE
Definition: block_fmha_pipeline_problem.hpp:210
static constexpr bool kDoFp8StaticQuant
Definition: block_fmha_pipeline_problem.hpp:211
remove_cvref_t< LSEDataType_ > LSEDataType
Definition: block_fmha_pipeline_problem.hpp:192
static constexpr bool kPadSeqLenQ
Definition: block_fmha_pipeline_problem.hpp:208
static constexpr index_t kN1
Definition: block_fmha_pipeline_problem.hpp:175
remove_cvref_t< OaccDataType_ > OaccDataType
Definition: block_fmha_pipeline_problem.hpp:193
Definition: block_fmha_pipeline_problem.hpp:172
static constexpr index_t NThreads
Definition: block_fmha_pipeline_problem.hpp:176
static constexpr index_t kM0
Definition: block_fmha_pipeline_problem.hpp:177
static constexpr index_t MaxVectorSize
Definition: block_fmha_pipeline_problem.hpp:173
static constexpr index_t kN1
Definition: block_fmha_pipeline_problem.hpp:175
Definition: tensor_layout.hpp:22
Definition: tensor_layout.hpp:17