warp_gemm_impl.hpp Source File
warp_gemm_impl.hpp
Go to the documentation of this file.
constexpr bool is_similiar_distributed_tensor_v
Definition static_distributed_tensor.hpp:230
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
constant< b > bool_constant
Definition tile/core/numeric/integral_constant.hpp:43
typename impl::ext_vector< T, N >::type ext_vector_t
Definition vector_type.hpp:84
CK_TILE_HOST_DEVICE constexpr auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition tile_distribution.hpp:480
Definition warp_gemm_impl.hpp:11
CK_TILE_DEVICE void operator()(CTensor &c, const ATensor &a, const BTensor &b, number< i_subk >, bool_constant< post_nop_ >={}) const
Definition warp_gemm_impl.hpp:73
typename WarpGemmAttribute::CWarpDstrEncoding CWarpDstrEncoding
Definition warp_gemm_impl.hpp:30
CK_TILE_DEVICE auto operator()(const ATensor &a, const BTensor &b) const
Definition warp_gemm_impl.hpp:129
typename WarpGemmAttribute::BWarpDstrEncoding BWarpDstrEncoding
Definition warp_gemm_impl.hpp:29
remove_cvref_t< decltype(make_static_tile_distribution(BWarpDstrEncoding{}))> BWarpDstr
Definition warp_gemm_impl.hpp:33
CK_TILE_DEVICE auto operator()(const ATensor &a, const BTensor &b, const int32_t &a_scale, const int32_t &b_scale) const
Definition warp_gemm_impl.hpp:154
static constexpr index_t kKPerThread
Definition warp_gemm_impl.hpp:22
typename WarpGemmAttribute::AWarpDstrEncoding AWarpDstrEncoding
Definition warp_gemm_impl.hpp:28
CK_TILE_DEVICE void operator()(CTensor &c, const ATensor &a, const BTensor &b, bool_constant< post_nop_ >={}) const
Definition warp_gemm_impl.hpp:47
static constexpr index_t kM
Definition warp_gemm_impl.hpp:14
static constexpr index_t kK
Definition warp_gemm_impl.hpp:16
static constexpr index_t kCMLane
Definition warp_gemm_impl.hpp:17
typename WarpGemmAttribute::CDataType CDataType
Definition warp_gemm_impl.hpp:26
typename WarpGemmAttribute::ADataType ADataType
Definition warp_gemm_impl.hpp:24
remove_cvref_t< decltype(make_static_tile_distribution(CWarpDstrEncoding{}))> CWarpDstr
Definition warp_gemm_impl.hpp:34
static_distributed_tensor< ADataType, AWarpDstr > AWarpTensor
Definition warp_gemm_impl.hpp:36
static_distributed_tensor< BDataType, BWarpDstr > BWarpTensor
Definition warp_gemm_impl.hpp:37
static constexpr index_t kN
Definition warp_gemm_impl.hpp:15
remove_cvref_t< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImplF32F32F32M16N16K4< WGAttrCtlEnum::Default_ > > > WarpGemmAttribute
Definition warp_gemm_impl.hpp:12
remove_cvref_t< decltype(make_static_tile_distribution(AWarpDstrEncoding{}))> AWarpDstr
Definition warp_gemm_impl.hpp:32
static_distributed_tensor< CDataType, CWarpDstr > CWarpTensor
Definition warp_gemm_impl.hpp:38
typename WarpGemmAttribute::BDataType BDataType
Definition warp_gemm_impl.hpp:25
CK_TILE_DEVICE void operator()(CTensor &c, const ATensor &a, const BTensor &b, const int32_t &a_scale, const int32_t &b_scale, bool_constant< post_nop_ >={}) const
Definition warp_gemm_impl.hpp:101
static CK_TILE_HOST_DEVICE constexpr auto get_num_of_access()
Definition warp_gemm_impl.hpp:40
Definition static_distributed_tensor.hpp:21