gridwise_gemm_xdlops_bwd_weight.hpp File Reference
gridwise_gemm_xdlops_bwd_weight.hpp File Reference
```cpp
#include "ck/utility/common_header.hpp"
#include "ck/tensor_description/multi_index_transform_helper.hpp"
#include "ck/tensor_description/tensor_descriptor.hpp"
#include "ck/tensor_description/tensor_descriptor_helper.hpp"
#include "ck/tensor_operation/gpu/grid/block_to_ctile_map.hpp"
#include "ck/tensor_operation/gpu/grid/gridwise_gemm_pipeline_selector.hpp"
#include "ck/tensor_operation/gpu/block/blockwise_gemm_xdlops.hpp"
#include "ck/tensor_operation/gpu/block/thread_group_tensor_slice_transfer_v4r1.hpp"
#include "ck/tensor_operation/gpu/block/thread_group_tensor_slice_transfer_v6r1.hpp"
#include "ck/tensor_operation/gpu/thread/threadwise_tensor_slice_transfer.hpp"
#include "ck/tensor_operation/gpu/element/element_wise_operation.hpp"
```

Go to the source code of this file.
| Namespaces | |
|---|---|
| namespace | `ck` |

| Functions | |
|---|---|
| `template<typename LowLengths>` | |
| `__host__ __device__ constexpr auto` | `ck::make_merge_transform_v4_no_carry (const LowLengths &low_lengths)` |
| `template<typename GridwiseGemm, typename FloatA, typename FloatB, typename FloatC, typename AGridDesc_B_K0_M_K1, typename BGridDesc_B_K0_N_K1, typename CGridDesc_MBlock_MPerBlock_NBlock_NPerBlock, typename AElementwiseOperation, typename BElementwiseOperation, typename CElementwiseOperation, typename CBlockClusterAdaptor, bool HasMainKBlockLoop>` | |
| `__global__ void` | `ck::kernel_gemm_xdlops_bwd_weight (const FloatA *__restrict__ p_a_grid, const FloatB *__restrict__ p_b_grid, FloatC *__restrict__ p_c_grid, const AGridDesc_B_K0_M_K1 a_b_k0_m_k1_grid_desc, const BGridDesc_B_K0_N_K1 b_b_k0_n_k1_grid_desc, const CGridDesc_MBlock_MPerBlock_NBlock_NPerBlock c_grid_desc_mblock_mperblock_nblock_nperblock, const AElementwiseOperation a_element_op, const BElementwiseOperation b_element_op, const CElementwiseOperation c_element_op, const CBlockClusterAdaptor c_block_cluster_adaptor)` |