block_fmha_bwd_convert_dq.hpp Source File
block_fmha_bwd_convert_dq.hpp
Go to the documentation of this file.
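(symbol name missing from extraction; presumably the ck_tile namespace — confirm against the original page)
Definition tile/core/algorithm/cluster_descriptor.hpp:13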
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_HOST_DEVICE constexpr auto make_static_distributed_tensor(const StaticTileDistribution &)
Definition static_distributed_tensor.hpp:142
CK_TILE_DEVICE constexpr auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition null_tile_window.hpp:75
CK_TILE_DEVICE auto cast_tile(const SrcTensor &src_tensor)
Definition tile_elementwise.hpp:327
CK_TILE_DEVICE void sweep_tile_span(TileDistributedSpan_, const F &f)
Definition sweep_tile.hpp:20
CK_TILE_DEVICE void move_tile_window(null_tile_window< WindowLengths > &, const typename null_tile_window< WindowLengths >::BottomTensorIndex &)
Definition null_tile_window.hpp:95
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition store_tile.hpp:23
CK_TILE_DEVICE void clear_tile(DstrTensors &dstr_tensor)
Definition tile_elementwise.hpp:177
CK_TILE_HOST_DEVICE constexpr Y type_convert(X x)
Definition tile/core/numeric/type_convert.hpp:29
CK_TILE_DEVICE auto load_tile(const TileWindow_ &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition load_tile.hpp:22
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
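(symbol name missing from extraction; likely the enclosing struct/class declaration, since the members listed here are defined at lines 14-66 of this file — confirm against the original page)
Definition block_fmha_bwd_convert_dq.hpp:13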
static constexpr bool kPadSeqLenQ
Definition block_fmha_bwd_convert_dq.hpp:25
static CK_TILE_HOST_DEVICE constexpr ck_tile::index_t GetSmemSize()
Definition block_fmha_bwd_convert_dq.hpp:34
static constexpr bool kIsDeterministic
Definition block_fmha_bwd_convert_dq.hpp:27
remove_cvref_t< typename Problem::AccDataType > AccDataType
Definition block_fmha_bwd_convert_dq.hpp:14
static constexpr index_t kAlignmentQGradAcc
Definition block_fmha_bwd_convert_dq.hpp:29
remove_cvref_t< typename Problem::QGradDataType > QGradDataType
Definition block_fmha_bwd_convert_dq.hpp:15
static constexpr index_t kBlockSize
Definition block_fmha_bwd_convert_dq.hpp:21
static constexpr index_t kM0
Definition block_fmha_bwd_convert_dq.hpp:17
static constexpr bool kPadHeadDimQ
Definition block_fmha_bwd_convert_dq.hpp:26
static constexpr index_t kBlockPerCu
Definition block_fmha_bwd_convert_dq.hpp:20
static constexpr index_t kAlignmentQGrad
Definition block_fmha_bwd_convert_dq.hpp:31
static constexpr index_t kN0
Definition block_fmha_bwd_convert_dq.hpp:18
CK_TILE_HOST_DEVICE void operator()(const QGradAccDramBlockWindowTmp &dq_acc_dram_block_window_tmp, QGradDramBlockWindowTmp &dq_dram_block_window_tmp, index_t nsplits) const
Definition block_fmha_bwd_convert_dq.hpp:66
static constexpr index_t kQKHeaddim
Definition block_fmha_bwd_convert_dq.hpp:22
CK_TILE_HOST_DEVICE void operator()(const QGradAccDramBlockWindowTmp &dq_acc_dram_block_window_tmp, QGradDramBlockWindowTmp &dq_dram_block_window_tmp) const
Definition block_fmha_bwd_convert_dq.hpp:39
static constexpr bool kIsGroupMode
Definition block_fmha_bwd_convert_dq.hpp:24