/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-6.4.3/include/ck_tile/host/reference/reference_rmsnorm2d_fwd.hpp Source File
reference_rmsnorm2d_fwd.hpp
Go to the documentation of this file.
Definition: cluster_descriptor.hpp:13
CK_TILE_HOST auto make_ParallelTensorFunctor(F f, Xs... xs)
Definition: host_tensor.hpp:272
void reference_rmsnorm2d_fwd(const HostTensor< XDataType > &x_m_n, const HostTensor< GammaDataType > &gamma_n, HostTensor< YDataType > &y_m_n, HostTensor< InvRmsDataType > &invRms_m, ComputeDataType epsilon, Epilogue epilogue_functor={})
Definition: reference_rmsnorm2d_fwd.hpp:39
const std::vector< std::size_t > & get_lengths() const
Definition: host_tensor.hpp:162
Definition: host_tensor.hpp:279
Definition: reference_rmsnorm2d_fwd.hpp:13
auto operator()(int m, const HostTensor< AccDataType > &acc)
Definition: reference_rmsnorm2d_fwd.hpp:25
void operator()(int m, HostTensor< OutDataType > &o, const HostTensor< AccDataType > &acc)
Definition: reference_rmsnorm2d_fwd.hpp:15