/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck/tensor_operation/gpu/device/impl/device_sparse_embeddings_forward_layernorm.hpp Source File
device_sparse_embeddings_forward_layernorm.hpp
Go to the documentation of this file.
float launch_and_time_kernel(const StreamConfig &stream_config, F kernel, dim3 grid_dim, dim3 block_dim, std::size_t lds_byte, Args... args)
Definition: kernel_launch.hpp:13
Definition: ck.hpp:264
__host__ constexpr __device__ auto make_naive_tensor_descriptor_packed(const Tuple< Lengths... > &lengths)
Definition: tensor_descriptor_helper.hpp:101
__global__ void kernel_sparse_embeddings_forward_layernorm(OutType *p_out, const ck::Array< EmbType *, NumEmbeddings > p_embs, const ck::Array< IndexType *, NumEmbeddings > p_indexes, const GammaDataType *p_gamma, const BetaDataType *p_beta, const OutGridDesc out_grid_desc, const AccDataType epsilon, const EmbElementwiseOperation emb_elementwise_op)
Definition: gridwise_sparse_embeddings_forward_layernorm.hpp:26
Definition: stream_config.hpp:10
Definition: gridwise_sparse_embeddings_forward_layernorm.hpp:57
Definition: device_base.hpp:50
Definition: device_base.hpp:61
Definition: device_base.hpp:76
Definition: device_sparse_embeddings_forward_layernorm.hpp:44
const GammaDataType * p_gamma_
Definition: device_sparse_embeddings_forward_layernorm.hpp:70
ck::index_t IndexLength_
Definition: device_sparse_embeddings_forward_layernorm.hpp:73
ck::Array< EmbType *, NumEmbeddings > p_embs_
Definition: device_sparse_embeddings_forward_layernorm.hpp:68
size_t grid_size_
Definition: device_sparse_embeddings_forward_layernorm.hpp:77
OutType * p_out_
Definition: device_sparse_embeddings_forward_layernorm.hpp:67
const BetaDataType * p_beta_
Definition: device_sparse_embeddings_forward_layernorm.hpp:71
ck::index_t EmbeddingDim_
Definition: device_sparse_embeddings_forward_layernorm.hpp:72
Argument(OutType *p_out, const ck::Array< EmbType *, NumEmbeddings > &p_embs, const ck::Array< IndexType *, NumEmbeddings > &p_indexs, const GammaDataType *p_gamma, const BetaDataType *p_beta, const ck::index_t EmbeddingDim, const ck::index_t IndexLength, const AccDataType epsilon, const EmbElementwiseOperation emb_elementwise_op)
Definition: device_sparse_embeddings_forward_layernorm.hpp:45
AccDataType epsilon_
Definition: device_sparse_embeddings_forward_layernorm.hpp:74
ck::Array< IndexType *, NumEmbeddings > p_indexs_
Definition: device_sparse_embeddings_forward_layernorm.hpp:69
EmbElementwiseOperation emb_elementwise_op_
Definition: device_sparse_embeddings_forward_layernorm.hpp:75
Definition: device_sparse_embeddings_forward_layernorm.hpp:121
float Run(const Argument &arg, const StreamConfig &stream_config=StreamConfig{})
Definition: device_sparse_embeddings_forward_layernorm.hpp:122
float Run(const BaseArgument *p_arg, const StreamConfig &stream_config=StreamConfig{}) override
Definition: device_sparse_embeddings_forward_layernorm.hpp:154
Definition: device_sparse_embeddings_forward_layernorm.hpp:37
std::unique_ptr< BaseArgument > MakeArgumentPointer(void *p_out, const ck::Array< EmbType *, NumEmbeddings > &p_embs, const ck::Array< IndexType *, NumEmbeddings > &p_indexs, const void *p_gamma, const void *p_beta, ck::index_t EmbeddingDim, ck::index_t IndexLength, const AccDataType epsilon, const EmbElementwiseOperation emb_elementwise_op)
Definition: device_sparse_embeddings_forward_layernorm.hpp:81
virtual std::unique_ptr< BaseInvoker > MakeInvokerPointer()
Definition: device_sparse_embeddings_forward_layernorm.hpp:171
static bool IsSupportedArgument(const Argument *p_arg)
Definition: device_sparse_embeddings_forward_layernorm.hpp:161
bool IsSupportedArgument(const BaseArgument *p_arg) override
Definition: device_sparse_embeddings_forward_layernorm.hpp:166
GridwiseSparseEmbeddingsForwardLayernorm< EmbType, IndexType, GammaDataType, BetaDataType, AccDataType, OutType, decltype(MakeOutputDescriptor(1, 1)), EmbElementwiseOperation, BlockSize, DimClusterSize, RowClusterSize, DimPerBlock, RowPerBlock, DimThreadSize, RowVectorSize, NumEmbeddings > GridwiseSparseEmbedding
Definition: device_sparse_embeddings_forward_layernorm.hpp:118
std::string GetTypeString() const override
Definition: device_sparse_embeddings_forward_layernorm.hpp:176
static auto MakeOutputDescriptor(const index_t index_length, const index_t rows)
Definition: device_sparse_embeddings_forward_layernorm.hpp:38