warp_gemm_smfmac_impl.hpp Source File
warp_gemm_smfmac_impl.hpp
Go to the documentation of this file.
constexpr bool is_similiar_distributed_tensor_v
Definition static_distributed_tensor.hpp:230
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
constant< b > bool_constant
Definition tile/core/numeric/integral_constant.hpp:43
typename impl::ext_vector< T, N >::type ext_vector_t
Definition vector_type.hpp:84
CK_TILE_HOST_DEVICE constexpr auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition tile_distribution.hpp:480
Definition warp_gemm_smfmac_impl.hpp:11
CK_TILE_DEVICE void operator()(CTensor &c, const ATensor &a, const BTensor &b, bool_constant< post_nop_ >={}) const
Definition warp_gemm_smfmac_impl.hpp:79
static constexpr index_t kK
Definition warp_gemm_smfmac_impl.hpp:16
typename WarpGemmAttribute::BDataType BDataType
Definition warp_gemm_smfmac_impl.hpp:24
typename WarpGemmAttribute::BWarpDstrEncoding BWarpDstrEncoding
Definition warp_gemm_smfmac_impl.hpp:28
static_distributed_tensor< CDataType, CWarpDstr > CWarpTensor
Definition warp_gemm_smfmac_impl.hpp:37
typename WarpGemmAttribute::ADataType ADataType
Definition warp_gemm_smfmac_impl.hpp:23
static_distributed_tensor< BDataType, BWarpDstr > BWarpTensor
Definition warp_gemm_smfmac_impl.hpp:36
remove_cvref_t< decltype(make_static_tile_distribution(BWarpDstrEncoding{}))> BWarpDstr
Definition warp_gemm_smfmac_impl.hpp:32
static constexpr index_t kM
Definition warp_gemm_smfmac_impl.hpp:14
remove_cvref_t< decltype(make_static_tile_distribution(CWarpDstrEncoding{}))> CWarpDstr
Definition warp_gemm_smfmac_impl.hpp:33
static constexpr index_t kKPerThread
Definition warp_gemm_smfmac_impl.hpp:21
static_distributed_tensor< ADataType, AWarpDstr > AWarpTensor
Definition warp_gemm_smfmac_impl.hpp:35
typename WarpGemmAttribute::CWarpDstrEncoding CWarpDstrEncoding
Definition warp_gemm_smfmac_impl.hpp:29
CK_TILE_DEVICE int32_t compress_a(AVec &a_vec) const
Compress A vector for 2:4 structured sparsity instruction by moving all non-zero elements into lower ...
Definition warp_gemm_smfmac_impl.hpp:53
static CK_TILE_HOST_DEVICE constexpr auto get_num_of_access()
Definition warp_gemm_smfmac_impl.hpp:39
typename WarpGemmAttribute::CDataType CDataType
Definition warp_gemm_smfmac_impl.hpp:25
remove_cvref_t< decltype(make_static_tile_distribution(AWarpDstrEncoding{}))> AWarpDstr
Definition warp_gemm_smfmac_impl.hpp:31
typename WarpGemmAttribute::AWarpDstrEncoding AWarpDstrEncoding
Definition warp_gemm_smfmac_impl.hpp:27
static constexpr index_t kN
Definition warp_gemm_smfmac_impl.hpp:15
remove_cvref_t< WarpGemmAttributeSmfmac< WarpGemmAttributeSmfmacImplF16F16F32M32N32K16< WGAttrCtlEnum::Default_ > > > WarpGemmAttribute
Definition warp_gemm_smfmac_impl.hpp:12
Definition static_distributed_tensor.hpp:21
Definition tile/core/utility/functional.hpp:43