gemm_group_quant_utils.hpp Source File
gemm_group_quant_utils.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
auto concat(const Ts &... xs) -> std::enable_if_t<!AllConvertibleToStringView< Ts... >, std::string >
Definition concat.hpp:43
CK_TILE_HOST_DEVICE constexpr auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition tile_distribution.hpp:480
Definition gemm_group_quant_utils.hpp:267
static CK_TILE_HOST const std::string GetName()
Definition gemm_group_quant_utils.hpp:272
Definition tile/core/container/sequence.hpp:49
Definition gemm_group_quant_utils.hpp:124
static constexpr index_t NWarps
Definition gemm_group_quant_utils.hpp:131
static constexpr index_t MWarps
Definition gemm_group_quant_utils.hpp:130
static constexpr index_t MIterPerWarp
Definition gemm_group_quant_utils.hpp:134
static constexpr index_t X
Definition gemm_group_quant_utils.hpp:142
static CK_TILE_HOST_DEVICE constexpr auto make_2d_static_tile_distribution()
Definition gemm_group_quant_utils.hpp:156
static constexpr index_t KWarps
Definition gemm_group_quant_utils.hpp:132
static constexpr index_t Y0
Definition gemm_group_quant_utils.hpp:147
static constexpr index_t num_warps
Definition gemm_group_quant_utils.hpp:128
static constexpr index_t Y2
Definition gemm_group_quant_utils.hpp:152
static constexpr index_t Y1
Definition gemm_group_quant_utils.hpp:150
static constexpr index_t XR
Definition gemm_group_quant_utils.hpp:143
static constexpr index_t warp_size
Definition gemm_group_quant_utils.hpp:127
Definition gemm_group_quant_utils.hpp:57
static constexpr index_t KWarps
Definition gemm_group_quant_utils.hpp:64
static constexpr index_t MWarps
Definition gemm_group_quant_utils.hpp:62
static CK_TILE_HOST_DEVICE constexpr auto make_2d_static_tile_distribution()
Definition gemm_group_quant_utils.hpp:73
static constexpr index_t warp_size
Definition gemm_group_quant_utils.hpp:59
static constexpr index_t NWarps
Definition gemm_group_quant_utils.hpp:63
static constexpr index_t num_warps
Definition gemm_group_quant_utils.hpp:60
static constexpr index_t MIterPerWarp
Definition gemm_group_quant_utils.hpp:66
Definition gemm_group_quant_utils.hpp:176
static constexpr index_t num_warps
Definition gemm_group_quant_utils.hpp:178
static constexpr index_t NWarps
Definition gemm_group_quant_utils.hpp:181
static constexpr index_t warp_size
Definition gemm_group_quant_utils.hpp:177
static constexpr index_t MWarps
Definition gemm_group_quant_utils.hpp:180
static CK_TILE_HOST_DEVICE constexpr auto make_2d_static_tile_distribution()
Creates a 2D tile distribution for BQ (B-matrix quantization scales).
Definition gemm_group_quant_utils.hpp:214
static constexpr index_t KWarps
Definition gemm_group_quant_utils.hpp:182
static constexpr index_t NIterPerWarp
Definition gemm_group_quant_utils.hpp:184
Definition static_encoding_pattern.hpp:108
Definition tile_distribution_encoding.hpp:26
Definition tile/core/container/tuple.hpp:192