device_gemm_multiple_d_wmma_cshuffle_v3.hpp Source File
device_gemm_multiple_d_wmma_cshuffle_v3.hpp
Go to the documentation of this file.
Definition convolution_backward_data_specialization.hpp:8
std::string getGemmSpecializationString(const GemmSpecialization &s)
Definition gemm_specialization.hpp:32
GemmSpecialization
Definition gemm_specialization.hpp:11
Definition convolution_backward_data_specialization.hpp:7
Definition ck.hpp:268
typename tuple_element< I, TTuple >::type tuple_element_t
Definition utility/tuple.hpp:208
static constexpr index_t KPack
Definition gridwise_gemm_wmma_cshuffle_v3_common.hpp:154
"Universal" GEMM kernel with SplitK support.
Definition gridwise_gemm_wmma_cshuffle_v3.hpp:233
Definition utility/tuple.hpp:117
Definition functional2.hpp:33
Definition device_base.hpp:197
Definition device_gemm_wmma_cshuffle_v3_common.hpp:43
static bool IsSupportedArgument(const Argument &arg)
Definition device_gemm_wmma_cshuffle_v3_common.hpp:268
"Universal" GEMM operation with SplitK support and multiple D tensors.
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:188
bool IsSupportedArgument(const BaseArgument *p_arg) override
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:273
static auto MakeArgument(const void *p_a, const void *p_b, std::array< const void *, NumDTensor > p_ds, void *p_e, index_t M, index_t N, index_t K, index_t StrideA, index_t StrideB, std::array< index_t, NumDTensor > StrideDs, index_t StrideE, index_t KBatch, AElementwiseOperation a_element_op, BElementwiseOperation b_element_op, CDEElementwiseOperation cde_element_op)
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:278
static bool IsSupportedArgument(const Argument &arg)
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:267
DeviceGemm_Wmma_CShuffleV3_Common< GridwiseGemm, Tuple< ADataType >, Tuple< BDataType >, DsDataType, EDataType, MPerBlock, NPerBlock, KPerBlock, BlockSize, AK1, BK1, GemmSpec, CDEShuffleBlockTransferScalarPerVectors, BlkGemmPipeSched, BlkGemmPipelineVer, ComputeTypeA, ComputeTypeB > DeviceGemmCommon
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:245
std::string GetTypeString() const override
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:355
typename DeviceGemmCommon::Invoker Invoker
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:265
std::unique_ptr< BaseArgument > MakeArgumentPointer(const void *p_a, const void *p_b, std::array< const void *, NumDTensor > p_ds, void *p_e, index_t M, index_t N, index_t K, index_t StrideA, index_t StrideB, std::array< ck::index_t, NumDTensor > StrideDs, index_t StrideE, index_t KBatch, AElementwiseOperation a_element_op, BElementwiseOperation b_element_op, CDEElementwiseOperation cde_element_op) override
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:315
static constexpr index_t NumDTensor
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:189
static auto MakeInvoker()
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:311
std::unique_ptr< BaseInvoker > MakeInvokerPointer() override
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:349
typename GridwiseGemm::Argument Argument
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:243
GridwiseGemm_wmma_cshuffle_v3< ALayout, BLayout, DsLayout, ELayout, Tuple< ADataType >, Tuple< BDataType >, AccDataType, CShuffleDataType, DsDataType, EDataType, AElementwiseOperation, BElementwiseOperation, CDEElementwiseOperation, GemmSpec, BlockSize, MPerBlock, NPerBlock, KPerBlock, AK1, BK1, MPerWmma, NPerWmma, MRepeat, NRepeat, ABlockTransferThreadClusterLengths_AK0_M_AK1, ABlockTransferThreadClusterArrangeOrder, ABlockTransferSrcAccessOrder, ABlockTransferSrcVectorDim, ABlockTransferSrcScalarPerVector, ABlockTransferDstScalarPerVector_AK1, false, ABlockLdsExtraM, BBlockTransferThreadClusterLengths_BK0_N_BK1, BBlockTransferThreadClusterArrangeOrder, BBlockTransferSrcAccessOrder, BBlockTransferSrcVectorDim, BBlockTransferSrcScalarPerVector, BBlockTransferDstScalarPerVector_BK1, false, BBlockLdsExtraN, CShuffleMRepeatPerShuffle, CShuffleNRepeatPerShuffle, CDEShuffleBlockTransferClusterLengths_MBlock_MPerBlock_NBlock_NPerBlock, CDEShuffleBlockTransferScalarPerVectors, BlkGemmPipeSched, BlkGemmPipelineVer, ComputeTypeA, ComputeTypeB, PermuteA, PermuteB > GridwiseGemm
Definition device_gemm_multiple_d_wmma_cshuffle_v3.hpp:191
Definition device_gemm_multiple_d.hpp:80