grid Directory Reference

grid Directory Reference

Composable Kernel: grid Directory Reference
grid Directory Reference

Directories

 
batchnorm_multiblock
 
gemm_layernorm
 
normalization

Files

 
block_to_ctile_map.hpp
 
epilogue_cshuffle_v3_welford_wmma.hpp
 
epilogue_cshuffle_v3_wmma.hpp
 
epilogue_cshuffle_v3_wmma_base.hpp
 
gridwise_2d_multiple_reduction_multiblock.hpp
 
gridwise_2d_multiple_reduction_threadwise.hpp
 
gridwise_2d_reduction_multiblock.hpp
 
gridwise_2d_reduction_threadwise.hpp
 
gridwise_2d_reduction_threadwise_multi_d.hpp
 
gridwise_ab_transfer_thread_tiles.hpp
 
gridwise_ab_transfer_wave_tiles.hpp
 
gridwise_batched_gemm_gemm_wmma_cshuffle_v3.hpp
 
gridwise_batched_gemm_gemm_xdl_cshuffle_v1.hpp
 
gridwise_batched_gemm_multiple_d_gemm_multiple_d_xdl_cshuffle_v1.hpp
 
gridwise_batched_gemm_multiple_d_softmax_gemm_xdl_cshuffle_v1.hpp
 
gridwise_batched_gemm_softmax_gemm_wmma_cshuffle.hpp
 
gridwise_batched_gemm_softmax_gemm_xdl_cshuffle_v1.hpp
 
gridwise_batchnorm_backward_blockwise_welford.hpp
 
gridwise_batchnorm_forward_blockwise_welford.hpp
 
gridwise_elementwise_1d_scale.hpp
 
gridwise_elementwise_2d.hpp
 
gridwise_elementwise_layernorm_welford_variance.hpp
 
gridwise_fpAintB_gemm_wmma.hpp
 
gridwise_gemm_bias_add_reduce_xdl_cshuffle_v1.hpp
 
gridwise_gemm_dl_multiple_d.hpp
 
gridwise_gemm_dl_v1r3.hpp
 
gridwise_gemm_dpp.hpp
 
gridwise_gemm_multiple_abd_xdl_cshuffle.hpp
 
gridwise_gemm_multiple_d_multiple_r_xdl_cshuffle.hpp
 
gridwise_gemm_multiple_d_wmma_cshuffle.hpp
 
gridwise_gemm_multiple_d_xdl_cshuffle.hpp
 
gridwise_gemm_multiple_d_xdl_cshuffle_lds_direct_load.hpp
 
gridwise_gemm_multiple_d_xdl_splitk_cshuffle.hpp
 
gridwise_gemm_pipeline_selector.hpp
 
gridwise_gemm_pipeline_v1.hpp
 
gridwise_gemm_pipeline_v2.hpp
 
gridwise_gemm_pipeline_v3.hpp
 
gridwise_gemm_pipeline_v4_direct_load.hpp
 
gridwise_gemm_reduce_xdl_cshuffle_v1.hpp
 
gridwise_gemm_split_k_multiple_d_xdl_cshuffle.hpp
 
gridwise_gemm_split_k_multiple_d_xdl_cshuffle_v2.hpp
 
gridwise_gemm_waveletmodel.hpp
 
gridwise_gemm_wmma.hpp
 
gridwise_gemm_wmma_cshuffle_v3.hpp
 
gridwise_gemm_wmma_cshuffle_v3_b_scale.hpp
 
gridwise_gemm_wmma_cshuffle_v3_common.hpp
 
gridwise_gemm_xdl_cshuffle_conv_v3.hpp
 
gridwise_gemm_xdl_cshuffle_streamk_v3.hpp
 
gridwise_gemm_xdl_cshuffle_v1.hpp
 
gridwise_gemm_xdl_cshuffle_v2.hpp
 
gridwise_gemm_xdl_cshuffle_v3.hpp
 
gridwise_gemm_xdl_cshuffle_v3_b_preshuffle.hpp
 
gridwise_gemm_xdl_cshuffle_v3_b_scale.hpp
 
gridwise_gemm_xdl_cshuffle_v3_multi_abd.hpp
 
gridwise_gemm_xdl_cshuffle_v3_multi_d.hpp
 
gridwise_gemm_xdl_cshuffle_v3_multi_d_ab_scale.hpp
 
gridwise_gemm_xdl_cshuffle_v3_multi_d_b_preshuffle.hpp
 
gridwise_gemm_xdl_cshuffle_v3_multi_d_blockscale_b_preshuffle.hpp
 
gridwise_gemm_xdl_cshuffle_v3_mx.hpp
 
gridwise_gemm_xdl_cshuffle_v3_mx_bpreshuffle.hpp
 
gridwise_gemm_xdl_layernorm_cshuffle_v1.hpp
 
gridwise_gemm_xdl_waveletmodel_cshuffle.hpp
 
gridwise_gemm_xdlops_bwd_weight.hpp
 
gridwise_gemm_xdlops_skip_b_lds_v1.hpp
 
gridwise_gemm_xdlops_splitk_lds_direct_load.hpp
 
gridwise_gemm_xdlops_streamk.hpp
 
gridwise_gemm_xdlops_v2r3.hpp
 
gridwise_gemm_xdlops_v2r4.hpp
 
gridwise_gemm_xdlops_v2r4r2.hpp
 
gridwise_gemm_xdlops_v3r1.hpp
 
gridwise_gemm_xdlops_v3r2.hpp
 
gridwise_gemm_xdlops_v3r3.hpp
 
gridwise_moe_gemm.hpp
 
gridwise_moe_gemm_blockscale.hpp
 
gridwise_moe_mx_gemm.hpp
 
gridwise_moe_mx_gemm_bns.hpp
 
gridwise_moe_mx_gemm_bpreshuffle.hpp
 
gridwise_permute.hpp
 
gridwise_put_element_1d.hpp
 
gridwise_set_buffer_value.hpp
 
gridwise_set_multiple_buffer_value.hpp
 
gridwise_softmax.hpp
 
gridwise_sparse_embeddings_forward_layernorm.hpp
 
gridwise_sparse_embeddings_forward_layernorm_builtins.hpp
 
gridwise_tensor_rearrange.hpp