DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize > Struct Template Reference
Classes |
Public Types |
Public Member Functions |
Static Public Member Functions |
Static Public Attributes |
List of all members
ck::tensor_operation::device::DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize > Struct Template Reference
#include <device_batchnorm_forward_impl.hpp>
Inheritance diagram for ck::tensor_operation::device::DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize >:
Classes | |
| struct | Argument |
| struct | Invoker |
Public Types | |
| using | XYGridDesc_M_K = decltype(MakeXY2dDescriptor({1}, {1}, 1, 1)) |
| using | ScaleBiasMeanVarGridDesc_M = decltype(MakeScaleBiasMeanVar1dDescriptor({1}, {1})) |
| using | XYGridDesc_M_K = decltype(MakeXY2dDescriptor({1}, {1}, 1, 1)) |
| using | ScaleBiasMeanVarGridDesc_M = decltype(MakeScaleBiasMeanVar1dDescriptor({1}, {1})) |
Public Member Functions | |
| size_t | GetWorkSpaceSize (const BaseArgument *pArg) const override |
| void | SetWorkSpacePointer (BaseArgument *pArg, void *p_workspace, const StreamConfig &=StreamConfig{}) const override |
| bool | IsSupportedArgument (const BaseArgument *pArg) override |
| std::unique_ptr< BaseArgument > | MakeArgumentPointer (const std::array< index_t, Rank > xyLengths, const std::array< index_t, Rank > xStrides, const std::array< index_t, Rank > yStrides, const std::array< int, NumBatchNormReduceDim > reduceDims, const std::array< index_t, Rank - NumBatchNormReduceDim > bnScaleBiasMeanVarLengths, const std::array< index_t, Rank - NumBatchNormReduceDim > bnScaleStrides, const std::array< index_t, Rank - NumBatchNormReduceDim > bnBiasStrides, const std::array< index_t, Rank - NumBatchNormReduceDim > bnMeanVarStrides, const void *p_x, const void *p_scale, const void *p_bias, double epsilon, const YElementwiseOp y_elementwise_op, void *p_y, void *resultSaveMean, void *resultSaveInvVariance, double averageFactor, void *resultRunningMean, void *resultRunningVariance) override |
| std::unique_ptr< BaseInvoker > | MakeInvokerPointer () override |
| std::string | GetTypeString () const override |
| size_t | GetWorkSpaceSize (const BaseArgument *pArg) const override |
| void | SetWorkSpacePointer (BaseArgument *pArg, void *p_workspace, const StreamConfig &=StreamConfig{}) const override |
| bool | IsSupportedArgument (const BaseArgument *pArg) override |
| std::unique_ptr< BaseArgument > | MakeArgumentPointer (const std::array< index_t, Rank > xyLengths, const std::array< index_t, Rank > xStrides, const std::array< index_t, Rank > yStrides, const std::array< int, NumBatchNormReduceDim > reduceDims, const std::array< index_t, Rank - NumBatchNormReduceDim > bnScaleBiasMeanVarLengths, const std::array< index_t, Rank - NumBatchNormReduceDim > bnScaleStrides, const std::array< index_t, Rank - NumBatchNormReduceDim > bnBiasStrides, const std::array< index_t, Rank - NumBatchNormReduceDim > bnMeanVarStrides, const void *p_x, const void *p_scale, const void *p_bias, double epsilon, const YElementwiseOp y_elementwise_op, void *p_y, void *resultSaveMean, void *resultSaveInvVariance, double averageFactor, void *resultRunningMean, void *resultRunningVariance) override |
| std::unique_ptr< BaseInvoker > | MakeInvokerPointer () override |
| std::string | GetTypeString () const override |
| Public Member Functions inherited from ck::tensor_operation::device::BaseOperator | |
| BaseOperator ()=default | |
| BaseOperator (const BaseOperator &)=default | |
| BaseOperator & | operator= (const BaseOperator &)=default |
| virtual std::string | GetInstanceString () const |
| virtual std::string | GetTypeIdName () const |
| virtual std::optional< std::string > | GetObjectName () const |
| virtual std::optional< std::string > | GetTemplateInfo () const |
| virtual std::string | GetTypeIdHashCode () const |
| virtual | ~BaseOperator () |
Static Public Member Functions | |
| static auto | MakeXY2dDescriptor (const std::array< index_t, Rank > &xyLengths, const std::array< index_t, Rank > &xyStrides, int blkGroupSize, int numBlockTileIteration) |
| static auto | MakeMeanVarCountOutputMG2dDescriptor (int invariantLength, int blkGroupSize) |
| static auto | MakeMeanVarCountInputMK2dDescriptor (int invariantLength, int blkGroupSize) |
| static auto | MakeScaleBiasMeanVar1dDescriptor (const std::array< index_t, NumInvariantDim > &lengths, const std::array< index_t, NumInvariantDim > &strides) |
| static auto | MakeXY2dDescriptor (const std::array< index_t, Rank > &xyLengths, const std::array< index_t, Rank > &xyStrides, int blkGroupSize, int numBlockTileIteration) |
| static auto | MakeMeanVarCountOutputMG2dDescriptor (int invariantLength, int blkGroupSize) |
| static auto | MakeMeanVarCountInputMK2dDescriptor (int invariantLength, int blkGroupSize) |
| static auto | MakeScaleBiasMeanVar1dDescriptor (const std::array< index_t, NumInvariantDim > &lengths, const std::array< index_t, NumInvariantDim > &strides) |
Static Public Attributes | |
| static constexpr index_t | NumInvariantDim = Rank - NumBatchNormReduceDim |
| static constexpr index_t | M_BlockTileSize = MThreadClusterSize * MThreadSliceSize |
| static constexpr index_t | K_BlockTileSize = KThreadClusterSize * KThreadSliceSize |
Member Typedef Documentation
◆ ScaleBiasMeanVarGridDesc_M [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
| using ck::tensor_operation::device::DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize >::ScaleBiasMeanVarGridDesc_M = decltype(MakeScaleBiasMeanVar1dDescriptor({1}, {1})) |
◆ ScaleBiasMeanVarGridDesc_M [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
| using ck::tensor_operation::device::DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize >::ScaleBiasMeanVarGridDesc_M = decltype(MakeScaleBiasMeanVar1dDescriptor({1}, {1})) |
◆ XYGridDesc_M_K [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
| using ck::tensor_operation::device::DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize >::XYGridDesc_M_K = decltype(MakeXY2dDescriptor({1}, {1}, 1, 1)) |
◆ XYGridDesc_M_K [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
| using ck::tensor_operation::device::DeviceBatchNormFwdImpl< XDataType, YDataType, AccDataType, ScaleDataType, BiasDataType, MeanVarDataType, YElementwiseOp, Rank, NumBatchNormReduceDim, UseMultiblockInK, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XSrcYDstVectorDim, XSrcVectorSize, YDstVectorSize, ScaleSrcVectorSize, BiasSrcVectorSize, MeanVarSrcDstVectorSize >::XYGridDesc_M_K = decltype(MakeXY2dDescriptor({1}, {1}, 1, 1)) |
Member Function Documentation
◆ GetTypeString() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ GetTypeString() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ GetWorkSpaceSize() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ GetWorkSpaceSize() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ IsSupportedArgument() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ IsSupportedArgument() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ MakeArgumentPointer() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
◆ MakeArgumentPointer() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
◆ MakeInvokerPointer() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
◆ MakeInvokerPointer() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
◆ MakeMeanVarCountInputMK2dDescriptor() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeMeanVarCountInputMK2dDescriptor() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeMeanVarCountOutputMG2dDescriptor() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeMeanVarCountOutputMG2dDescriptor() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeScaleBiasMeanVar1dDescriptor() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeScaleBiasMeanVar1dDescriptor() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeXY2dDescriptor() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ MakeXY2dDescriptor() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline static |
◆ SetWorkSpacePointer() [1/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ SetWorkSpacePointer() [2/2]
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
Member Data Documentation
◆ K_BlockTileSize
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
static constexpr |
◆ M_BlockTileSize
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
static constexpr |
◆ NumInvariantDim
template<typename XDataType, typename YDataType, typename AccDataType, typename ScaleDataType, typename BiasDataType, typename MeanVarDataType, typename YElementwiseOp, index_t Rank, index_t NumBatchNormReduceDim, bool UseMultiblockInK, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t XSrcYDstVectorDim, index_t XSrcVectorSize, index_t YDstVectorSize, index_t ScaleSrcVectorSize, index_t BiasSrcVectorSize, index_t MeanVarSrcDstVectorSize>
|
static constexpr |
The documentation for this struct was generated from the following files: