Argument Struct Reference
ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument Struct Reference
#include <device_batchnorm_backward_impl.hpp>
Inheritance diagram for ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument: (diagram not rendered in this text export; Argument derives from ck::tensor_operation::device::BaseArgument)
Public Member Functions | |
| Argument (const std::array< index_t, Rank > xyLengths, const std::array< index_t, Rank > xStrides, const std::array< index_t, Rank > dyStrides, const std::array< index_t, Rank > dxStrides, const std::array< int, NumBatchNormReduceDim > reduceDims, const std::array< ck::index_t, NumInvariantDim > bnScaleBiasMeanVarLengths, const std::array< ck::index_t, NumInvariantDim > bnScaleStrides, const std::array< ck::index_t, NumInvariantDim > bnDscaleDbiasStrides, const std::array< ck::index_t, NumInvariantDim > bnMeanVarStrides, const XDataType *p_x, const DyDataType *p_dy, const ScaleDataType *p_scale, const MeanVarDataType *p_savedMean, const MeanVarDataType *p_savedInvVar, const DyElementwiseOp dy_elementwise_op, double epsilon, DxDataType *p_dx, DscaleDbiasDataType *p_dscale, DscaleDbiasDataType *p_dbias) | |
Public Member Functions inherited from ck::tensor_operation::device::BaseArgument | |
| BaseArgument ()=default | |
| BaseArgument (const BaseArgument &)=default | |
| BaseArgument & | operator= (const BaseArgument &)=default |
| virtual | ~BaseArgument () |
Constructor & Destructor Documentation
◆ Argument()
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
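| ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::Argument (const std::array< index_t, Rank > xyLengths, const std::array< index_t, Rank > xStrides, const std::array< index_t, Rank > dyStrides, const std::array< index_t, Rank > dxStrides, const std::array< int, NumBatchNormReduceDim > reduceDims, const std::array< ck::index_t, NumInvariantDim > bnScaleBiasMeanVarLengths, const std::array< ck::index_t, NumInvariantDim > bnScaleStrides, const std::array< ck::index_t, NumInvariantDim > bnDscaleDbiasStrides, const std::array< ck::index_t, NumInvariantDim > bnMeanVarStrides, const XDataType *p_x, const DyDataType *p_dy, const ScaleDataType *p_scale, const MeanVarDataType *p_savedMean, const MeanVarDataType *p_savedInvVar, const DyElementwiseOp dy_elementwise_op, double epsilon, DxDataType *p_dx, DscaleDbiasDataType *p_dscale, DscaleDbiasDataType *p_dbias) | inline |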
Member Data Documentation
◆ blkGroupSize
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| int ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::blkGroupSize |
◆ bnDscaleDbiasStrides_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank - NumBatchNormReduceDim> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::bnDscaleDbiasStrides_ |
◆ bnMeanVarStrides_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank - NumBatchNormReduceDim> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::bnMeanVarStrides_ |
◆ bnScaleBiasMeanVarLengths_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank - NumBatchNormReduceDim> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::bnScaleBiasMeanVarLengths_ |
◆ bnScaleStrides_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank - NumBatchNormReduceDim> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::bnScaleStrides_ |
◆ dscale_dbias_grid_desc_m
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| ScaleBiasGridDesc_M ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::dscale_dbias_grid_desc_m |
◆ dx_grid_desc_m_k
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| XYGridDesc_M_K ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::dx_grid_desc_m_k |
◆ dxStrides_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::dxStrides_ |
◆ dy_elementwise_op_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| const DyElementwiseOp ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::dy_elementwise_op_ |
◆ dy_grid_desc_m_k
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| XYGridDesc_M_K ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::dy_grid_desc_m_k |
◆ dyStrides_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::dyStrides_ |
◆ epsilon_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| AccDataType ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::epsilon_ |
◆ gridSize
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| size_t ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::gridSize |
◆ haveSavedMeanInvVar_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| bool ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::haveSavedMeanInvVar_ |
◆ invariant_length
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| long_index_t ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::invariant_length |
◆ mean_var_grid_desc_m
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| MeanVarGridDesc_M ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::mean_var_grid_desc_m |
◆ numBlockTileIteration
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| int ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::numBlockTileIteration |
◆ p_dbias_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| DscaleDbiasDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_dbias_ |
◆ p_dscale_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| DscaleDbiasDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_dscale_ |
◆ p_dx_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| DxDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_dx_ |
◆ p_dy_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| const DyDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_dy_ |
◆ p_savedInvVar_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| const MeanVarDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_savedInvVar_ |
◆ p_savedMean_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| const MeanVarDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_savedMean_ |
◆ p_scale_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| const ScaleDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_scale_ |
◆ p_x_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| const XDataType* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::p_x_ |
◆ reduce_length
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| long_index_t ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::reduce_length |
◆ scale_grid_desc_m
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| ScaleBiasGridDesc_M ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::scale_grid_desc_m |
◆ workspace_count
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_count |
◆ workspace_mean
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_mean |
◆ workspace_reduce_dbias
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_reduce_dbias |
◆ workspace_reduce_dscale
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_reduce_dscale |
◆ workspace_savedInvVar
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_savedInvVar |
◆ workspace_savedMean
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_savedMean |
◆ workspace_variance
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| void* ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::workspace_variance |
◆ x_grid_desc_m_k
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| XYGridDesc_M_K ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::x_grid_desc_m_k |
◆ xStrides_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::xStrides_ |
◆ xyLengths_
template<typename XDataType , typename DxDataType , typename DyDataType , typename AccDataType , typename ScaleDataType , typename DscaleDbiasDataType , typename MeanVarDataType , typename DyElementwiseOp , index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XDyDxVectorDim, index_t XSrcVectorSize, index_t DySrcVectorSize, index_t DxDstVectorSize, index_t ScaleSrcVectorSize, index_t DscaleDbiasDstVectorSize, index_t MeanVarSrcVectorSize>
| std::array<index_t, Rank> ck::tensor_operation::device::DeviceBatchNormBwdImpl< XDataType, DxDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyDxVectorDim, XSrcVectorSize, DySrcVectorSize, DxDstVectorSize, ScaleSrcVectorSize, DscaleDbiasDstVectorSize, MeanVarSrcVectorSize >::Argument::xyLengths_ |
The documentation for this struct was generated from the following file:
- /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/docs-7.0.1/include/ck/tensor_operation/gpu/device/impl/device_batchnorm_backward_impl.hpp
Public Member Functions inherited from