batched_transpose_lds_pipeline.hpp Source File
batched_transpose_lds_pipeline.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_HOST_DEVICE constexpr auto make_tensor_view(DataType *__restrict__ p, const tensor_descriptor< Ts... > &desc)
Definition tensor_view.hpp:452
CK_TILE_DEVICE auto load_tile_transpose(const tile_window_with_static_distribution< BottomTensorView_, WindowLengths_, TileDistribution_, NumCoord > &tile_window)
Transpose-loads a tile from a tensor and returns the resulting tensor with a new (transposed) tile distribution.
Definition load_tile_transpose.hpp:403
CK_TILE_DEVICE constexpr auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition null_tile_window.hpp:75
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition store_tile.hpp:23
CK_TILE_DEVICE auto load_tile(const TileWindow_ &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition load_tile.hpp:22
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
Definition batched_transpose_lds_pipeline.hpp:10
CK_TILE_DEVICE void operator()(const InputTileWindow &input_window, OutputTileWindow &output_window)
Definition batched_transpose_lds_pipeline.hpp:28
static constexpr index_t kLeadSizePerBlock
Definition batched_transpose_lds_pipeline.hpp:17
remove_cvref_t< typename Problem::DataType > DataType
Definition batched_transpose_lds_pipeline.hpp:14
static constexpr index_t GetVectorSize()
Definition batched_transpose_lds_pipeline.hpp:20
remove_cvref_t< Problem_ > Problem
Definition batched_transpose_lds_pipeline.hpp:11
static constexpr index_t kBlockSize
Definition batched_transpose_lds_pipeline.hpp:16
remove_cvref_t< Policy_ > Policy
Definition batched_transpose_lds_pipeline.hpp:12
static CK_TILE_DEVICE constexpr index_t GetSmemSize()
Definition batched_transpose_lds_pipeline.hpp:22
static constexpr index_t kSecondSizePerBlock
Definition batched_transpose_lds_pipeline.hpp:18