/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck/tensor_operation/gpu/device/impl/device_gemm_reduce_wmma_cshuffle_v3.hpp File Reference
device_gemm_reduce_wmma_cshuffle_v3.hpp File Reference
#include <iostream>
#include <sstream>
#include "ck/utility/common_header.hpp"
#include "ck/tensor_description/tensor_descriptor.hpp"
#include "ck/tensor_description/tensor_descriptor_helper.hpp"
#include "ck/tensor_operation/gpu/device/tensor_layout.hpp"
#include "ck/tensor_operation/gpu/device/device_gemm_reduce.hpp"
#include "ck/tensor_operation/gpu/device/gemm_specialization.hpp"
#include "ck/tensor_operation/gpu/grid/gridwise_gemm_wmma_cshuffle_v3.hpp"
#include "ck/host_utility/device_prop.hpp"
#include "ck/host_utility/kernel_launch.hpp"
Go to the source code of this file.
Namespaces | |
| ck | |
| ck::tensor_operation | |
| ck::tensor_operation::device | |
Functions | |
| template<typename GridwiseGemm, typename ReduceTrait, bool HasMainKBlockLoop, InMemoryDataOperationEnum EGlobalMemoryDataOperation, index_t MinimumOccupancy = 1, TailNumber TailNum = TailNumber::Full> | |
| __global__ void | ck::kernel_gemm_reduce_wmma_cshuffle_v3(typename GridwiseGemm::Argument karg, typename ReduceTrait::ReducePtrsGlobal_ p_reduces_grid, const typename ReduceTrait::ReduceInElementwiseOperations_ reduce_in_element_ops, const typename ReduceTrait::ReduceAccElementwiseOperations_ reduce_out_element_ops) |