DeviceSoftmaxImpl< InDataType, AccDataType, OutDataType, InElementwiseOp, AccElementwiseOp, Rank, NumReduceDim, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize > Struct Template Reference
Classes |
Public Types |
Public Member Functions |
Static Public Member Functions |
Static Public Attributes |
List of all members
ck::tensor_operation::device::DeviceSoftmaxImpl< InDataType, AccDataType, OutDataType, InElementwiseOp, AccElementwiseOp, Rank, NumReduceDim, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize > Struct Template Reference
#include <device_softmax_impl.hpp>
Inheritance diagram for ck::tensor_operation::device::DeviceSoftmaxImpl< InDataType, AccDataType, OutDataType, InElementwiseOp, AccElementwiseOp, Rank, NumReduceDim, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize >:
Classes | |
| struct | Argument |
| struct | Invoker |
Public Types | |
| using | GridDesc_M_K = decltype(MakeSrc2dDescriptor({1}, {1}, 1, 1)) |
| using | GridwiseSoftmaxGeneric |
| using | GridwiseSoftmaxSweepOnce |
Public Member Functions | |
| bool | IsSupportedArgument (const BaseArgument *p_arg) override |
| std::unique_ptr< BaseArgument > | MakeArgumentPointer (const std::vector< index_t > inLengths, const std::vector< index_t > inStrides, const std::vector< int > reduceDims, double alpha, double beta, const void *in_dev, void *out_dev, InElementwiseOp in_elementwise_op, AccElementwiseOp acc_elementwise_op) override |
| std::unique_ptr< BaseInvoker > | MakeInvokerPointer () override |
| std::string | GetTypeString () const override |
| Public Member Functions inherited from ck::tensor_operation::device::BaseOperator | |
| BaseOperator ()=default | |
| BaseOperator (const BaseOperator &)=default | |
| BaseOperator & | operator= (const BaseOperator &)=default |
| virtual std::string | GetInstanceString () const |
| virtual std::string | GetTypeIdName () const |
| virtual std::optional< std::string > | GetObjectName () const |
| virtual std::optional< std::string > | GetTemplateInfo () const |
| virtual std::string | GetTypeIdHashCode () const |
| virtual size_t | GetWorkSpaceSize (const BaseArgument *) const |
| virtual void | SetWorkSpacePointer (BaseArgument *p_arg, void *p_workspace, const StreamConfig &=StreamConfig{}) const |
| virtual | ~BaseOperator () |
Static Public Member Functions | |
| static auto | MakeSrc2dDescriptor (const std::vector< index_t > &inLengths, const std::vector< index_t > &inStrides, int blkGroupSize, int numBlockTileIteration) |
| static bool | IsSupportedArgument (const Argument &arg) |
| static auto | MakeArgument (const std::vector< index_t > inLengths, const std::vector< index_t > inStrides, const std::vector< int > reduceDims, double alpha, double beta, const InDataType *in_dev, OutDataType *out_dev, InElementwiseOp in_elementwise_op, AccElementwiseOp acc_elementwise_op) |
| static auto | MakeInvoker () |
Static Public Attributes | |
| static constexpr index_t | NumInvariantDim = Rank - NumReduceDim |
| static constexpr index_t | NumSrcDim = Rank |
| static constexpr index_t | NumDstDim = (NumInvariantDim == 0) ? 1 : NumInvariantDim |
| static constexpr bool | reduceAllDim = (NumInvariantDim == 0) |
| static constexpr index_t | M_BlockTileSize = MThreadClusterSize * MThreadSliceSize |
| static constexpr index_t | K_BlockTileSize = KThreadClusterSize * KThreadSliceSize |
Member Typedef Documentation
◆ GridDesc_M_K
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
| using ck::tensor_operation::device::DeviceSoftmaxImpl< InDataType, AccDataType, OutDataType, InElementwiseOp, AccElementwiseOp, Rank, NumReduceDim, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize >::GridDesc_M_K = decltype(MakeSrc2dDescriptor({1}, {1}, 1, 1)) |
◆ GridwiseSoftmaxGeneric
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
| using ck::tensor_operation::device::DeviceSoftmaxImpl< InDataType, AccDataType, OutDataType, InElementwiseOp, AccElementwiseOp, Rank, NumReduceDim, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize >::GridwiseSoftmaxGeneric |
Initial value:
GridwiseSoftmax_mk_to_mk<InDataType,
OutDataType,
AccDataType,
BlockSize,
MThreadClusterSize,
KThreadClusterSize,
MThreadSliceSize,
KThreadSliceSize,
InSrcVectorDim,
InSrcVectorSize,
OutDstVectorSize,
false>
Definition gridwise_softmax.hpp:55
decltype(MakeSrc2dDescriptor({1}, {1}, 1, 1)) GridDesc_M_K
Definition device_softmax_impl.hpp:117
◆ GridwiseSoftmaxSweepOnce
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
| using ck::tensor_operation::device::DeviceSoftmaxImpl< InDataType, AccDataType, OutDataType, InElementwiseOp, AccElementwiseOp, Rank, NumReduceDim, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize >::GridwiseSoftmaxSweepOnce |
Initial value:
GridwiseSoftmax_mk_to_mk<InDataType,
OutDataType,
AccDataType,
BlockSize,
MThreadClusterSize,
KThreadClusterSize,
MThreadSliceSize,
KThreadSliceSize,
InSrcVectorDim,
InSrcVectorSize,
OutDstVectorSize,
true>
Member Function Documentation
◆ GetTypeString()
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ IsSupportedArgument() [1/2]
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline static |
◆ IsSupportedArgument() [2/2]
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline override virtual |
Reimplemented from ck::tensor_operation::device::BaseOperator.
◆ MakeArgument()
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline static |
◆ MakeArgumentPointer()
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline override virtual |
◆ MakeInvoker()
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline static |
◆ MakeInvokerPointer()
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline override virtual |
◆ MakeSrc2dDescriptor()
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
inline static |
Member Data Documentation
◆ K_BlockTileSize
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
static constexpr |
◆ M_BlockTileSize
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
static constexpr |
◆ NumDstDim
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
static constexpr |
◆ NumInvariantDim
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
static constexpr |
◆ NumSrcDim
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
static constexpr |
◆ reduceAllDim
template<typename InDataType, typename AccDataType, typename OutDataType, typename InElementwiseOp, typename AccElementwiseOp, index_t Rank, index_t NumReduceDim, index_t BlockSize, index_t MThreadClusterSize, index_t KThreadClusterSize, index_t MThreadSliceSize, index_t KThreadSliceSize, index_t InSrcVectorDim, index_t InSrcVectorSize, index_t OutDstVectorSize>
|
static constexpr |
The documentation for this struct was generated from the following file: