gemm_quant_pipeline_problem.hpp Source File
gemm_quant_pipeline_problem.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
GemmQuantPipelineProblemBase< ADataType_, AccDataType_, BDataType_, AccDataType_, CDataType_, BlockGemmShape_, Traits_, QuantGroupShape< sequence< 1, 1, 1 > >, TransposeC_, ComputeDataType_, Scheduler_, HasHotLoop_, TailNum_ > GemmRowColTensorQuantPipelineProblem
Definition gemm_quant_pipeline_problem.hpp:171
auto concat(const Ts &... xs) -> std::enable_if_t<!AllConvertibleToStringView< Ts... >, std::string >
Definition concat.hpp:43
GemmQuantPipelineProblemBase< ADataType_, AQDataType_, BDataType_, void, CDataType_, BlockGemmShape_, Traits_, QuantGroupSize_, TransposeC_, ComputeDataType_, Scheduler_, HasHotLoop_, TailNum_ > GemmAQuantPipelineProblem
Definition gemm_quant_pipeline_problem.hpp:121
GemmPipelineScheduler
Definition gemm_pipeline_ag_bg_cr_scheduler.hpp:14
GemmPipelineScheduler::Intrawave
Definition gemm_pipeline_ag_bg_cr_scheduler.hpp:16
GemmQuantPipelineProblemBase< ADataType_, void, BDataType_, BQDataType_, CDataType_, BlockGemmShape_, Traits_, QuantGroupSize_, false, ComputeDataType_, Scheduler_, HasHotLoop_, TailNum_ > GemmBQuantPipelineProblem
Definition gemm_quant_pipeline_problem.hpp:146
GemmPipelineProblemBase
Definition gemm_pipeline_problem.hpp:25
remove_cvref_t< std::tuple_element_t< number< 0 >{}, BsDataTypeTuple > > BDataType
Definition gemm_pipeline_problem.hpp:69
remove_cvref_t< BlockGemmShape_ > BlockGemmShape
Definition gemm_pipeline_problem.hpp:34
remove_cvref_t< std::tuple_element_t< number< 0 >{}, ComputeDataTypeTuple > > ComputeDataType
Definition gemm_pipeline_problem.hpp:66
static constexpr bool kPadK
Definition gemm_pipeline_problem.hpp:80
remove_cvref_t< std::tuple_element_t< number< 0 >{}, AsLayoutTuple > > ALayout
Definition gemm_pipeline_problem.hpp:68
remove_cvref_t< std::tuple_element_t< number< 0 >{}, AsDataTypeTuple > > ADataType
Definition gemm_pipeline_problem.hpp:67
static constexpr index_t kBlockSize
Definition gemm_pipeline_problem.hpp:76
static constexpr bool kPadM
Definition gemm_pipeline_problem.hpp:78
remove_cvref_t< std::tuple_element_t< number< 0 >{}, BsLayoutTuple > > BLayout
Definition gemm_pipeline_problem.hpp:70
remove_cvref_t< typename Traits::CLayout > CLayout
Definition gemm_pipeline_problem.hpp:41
remove_cvref_t< CDataType_ > CDataType
Definition gemm_pipeline_problem.hpp:30
remove_cvref_t< Traits_ > Traits
Definition gemm_pipeline_problem.hpp:26
static constexpr bool kPadN
Definition gemm_pipeline_problem.hpp:79
static constexpr index_t VectorLoadSize
Definition gemm_pipeline_problem.hpp:84
GemmQuantPipelineProblemBase
Definition gemm_quant_pipeline_problem.hpp:33
static constexpr bool kPadN
static constexpr bool PreshuffleB
Definition gemm_quant_pipeline_problem.hpp:58
remove_cvref_t< BQDataType_ > BQDataType
Definition gemm_quant_pipeline_problem.hpp:48
remove_cvref_t< AQDataType_ > AQDataType
Definition gemm_quant_pipeline_problem.hpp:47
remove_cvref_t< typename Traits::BQLayout > BQLayout
Definition gemm_quant_pipeline_problem.hpp:69
static CK_TILE_HOST_DEVICE constexpr auto GetAlignmentAQ()
Definition gemm_quant_pipeline_problem.hpp:90
static constexpr bool TransposeC
Definition gemm_quant_pipeline_problem.hpp:57
remove_cvref_t< typename Traits::AQLayout > AQLayout
Definition gemm_quant_pipeline_problem.hpp:68
typename Base::BlockGemmShape BlockGemmShape
Definition gemm_quant_pipeline_problem.hpp:50
static constexpr auto Scheduler
Definition gemm_quant_pipeline_problem.hpp:71
static constexpr index_t VectorSizeBQ
Definition gemm_quant_pipeline_problem.hpp:106
static constexpr index_t kBlockSize
static constexpr auto TailNum
Definition gemm_quant_pipeline_problem.hpp:73
QuantGroupSize_ QuantGroupSize
Definition gemm_quant_pipeline_problem.hpp:51
static constexpr bool DoubleSmemBuffer
Definition gemm_quant_pipeline_problem.hpp:59
static CK_TILE_HOST const std::string GetName()
Definition gemm_quant_pipeline_problem.hpp:79
typename Base::Traits Traits
Definition gemm_quant_pipeline_problem.hpp:41
GemmPipelineProblemBase< ADataType_, BDataType_, CDataType_, BlockGemmShape_, Traits_, ComputeDataType_ > Base
Definition gemm_quant_pipeline_problem.hpp:34
static constexpr bool kPadK
static CK_TILE_HOST_DEVICE constexpr auto GetAlignmentBQ()
Definition gemm_quant_pipeline_problem.hpp:101
static constexpr index_t VectorLoadSize
static constexpr index_t VectorSizeAQ
Definition gemm_quant_pipeline_problem.hpp:96
static constexpr bool kPadM
static constexpr auto HasHotLoop
Definition gemm_quant_pipeline_problem.hpp:72
Definition gemm_group_quant_utils.hpp:267