/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-7.0.0/include/ck_tile/ops/gemm/warp/warp_gemm.hpp Source File

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-7.0.0/include/ck_tile/ops/gemm/warp/warp_gemm.hpp Source File#

Composable Kernel: /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-7.0.0/include/ck_tile/ops/gemm/warp/warp_gemm.hpp Source File
warp_gemm.hpp
Go to the documentation of this file.
1 // SPDX-License-Identifier: MIT
2 // Copyright (c) 2018-2025, Advanced Micro Devices, Inc. All rights reserved.
3 
4 #pragma once
5 
6 #include "ck_tile/core.hpp"
9 
12 
13 namespace ck_tile {
14 
15 // fp16
16 
19 
22 
23 #if defined(__gfx950__)
26 
27 #else
30  2>>;
31 #endif
32 
33 #if defined(__gfx950__)
36 #else
39  2>>;
40 #endif
41 
44  1>>;
45 
48  2>>;
49 
53 
57 
58 #if defined(__gfx950__)
62 #else
66  2>>;
67 #endif
68 
69 #if defined(__gfx950__)
73 #else
77  2>>;
78 #endif
79 
80 #if defined(__gfx950__)
81 using WarpGemmMfmaF16F16F32M16N16K32SwizzleBTransposedCDistribution =
84  1>>;
85 
86 using WarpGemmMfmaBf16Bf16F32M16N16K32SwizzleBTransposedCDistribution =
89  1>>;
90 #endif
91 
92 #if defined(__gfx950__)
96 #else
100  2>>;
101 #endif
102 
105  4>>;
106 
109  4>>;
110 
111 // fp16 2:4 structured sparsity
114 
117 
118 // bf16
121 
124 
125 #if defined(__gfx950__)
128 
129 #else
132  2>>;
133 #endif
134 
135 #if defined(__gfx950__)
138 #else
141  2>>;
142 #endif
143 
146  1>>;
147 
151  2>>;
152 
156 
160 
161 #if defined(__gfx950__)
165 #else
169  2>>;
170 #endif
171 
172 #if defined(__gfx950__)
176 #else
180  2>>;
181 #endif
182 
183 #if defined(__gfx950__)
187 #else
191  2>>;
192 #endif
193 
196  4>>;
197 
200  4>>;
201 
202 // fp8
203 
206 
209 
212 
215 
218  2>>;
219 
222  2>>;
223 
226 
229 
232  2>>;
233 
236  2>>;
237 
240 
243 
246 
249 
252 
255 
258 
261 
265 
269 
273 
277 
278 template <index_t swizzle_factor = 2>
282  2,
283  swizzle_factor>>;
284 
285 // int8
288 
292 
295 
299 
300 } // namespace ck_tile
Definition: cluster_descriptor.hpp:13
Definition: warp_gemm_attribute_mfma.hpp:13
Definition: warp_gemm_attribute_mfma.hpp:814
Definition: warp_gemm_attribute_mfma.hpp:455
Definition: warp_gemm_attribute_mfma.hpp:78
Definition: warp_gemm_attribute_mfma.hpp:361
Definition: warp_gemm_attribute_mfma.hpp:294
Definition: warp_gemm_attribute_mfma_impl.hpp:1347
Definition: warp_gemm_attribute_mfma_impl.hpp:983
Definition: warp_gemm_attribute_mfma_impl.hpp:1142
Definition: warp_gemm_attribute_mfma_impl.hpp:1614
Definition: warp_gemm_attribute_mfma_impl.hpp:1544
Definition: warp_gemm_attribute_mfma_impl.hpp:537
Definition: warp_gemm_attribute_mfma_impl.hpp:67
Definition: warp_gemm_attribute_mfma_impl.hpp:868
Definition: warp_gemm_attribute_mfma_impl.hpp:448
Definition: warp_gemm_attribute_mfma_impl.hpp:625
Definition: warp_gemm_attribute_mfma_impl.hpp:689
Definition: warp_gemm_attribute_mfma_impl.hpp:193
Definition: warp_gemm_attribute_mfma_impl.hpp:256
Definition: warp_gemm_attribute_mfma_impl.hpp:754
Definition: warp_gemm_attribute_mfma_impl.hpp:130
Definition: warp_gemm_attribute_mfma_impl.hpp:319
Definition: warp_gemm_attribute_mfma_impl.hpp:383
Class describing structured sparsity mfma instructions.
Definition: warp_gemm_attribute_smfmac.hpp:26
Definition: warp_gemm_attribute_smfmac_impl.hpp:65
Definition: warp_gemm_attribute_smfmac_impl.hpp:14
Definition: warp_gemm_impl.hpp:11
Definition: warp_gemm_smfmac_impl.hpp:11