gemm_pipeline_agmem_bgmem_creg_v1.hpp Source File
gemm_pipeline_agmem_bgmem_creg_v1.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_HOST_DEVICE constexpr auto make_tensor_view(DataType *__restrict__ p, const tensor_descriptor< Ts... > &desc)
Definition tensor_view.hpp:452
CK_TILE_DEVICE auto load_tile_with_elementwise(const TileWindow_ &tile_window, ElementWise_ elementwise, number< i_access >={}, bool_constant< oob_conditional_check >={})
Load tile with elementwise function.
Definition load_tile.hpp:41
typename detail::detector< nonesuch, void, Op, Args... >::value_t is_detected
Definition type_traits.hpp:67
CK_TILE_DEVICE void tile_elementwise_inout(const InOutElementFunc &inout_element_func, InOutDstrTensors &... inout_dstr_tensors)
Definition tile_elementwise.hpp:23
auto concat(const Ts &... xs) -> std::enable_if_t<!AllConvertibleToStringView< Ts... >, std::string >
Definition concat.hpp:43
CK_TILE_DEVICE void transpose_tile2d(OutTensor &out, const InTensor &in)
Definition transpose_tile.hpp:195
CK_TILE_HOST_DEVICE constexpr auto make_static_distributed_tensor(const StaticTileDistribution &)
Definition static_distributed_tensor.hpp:142
CK_TILE_DEVICE constexpr auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition null_tile_window.hpp:75
CK_TILE_HOST_DEVICE constexpr auto generate_tuple(F &&f, number< N >)
Definition tile/core/container/tuple.hpp:429
CK_TILE_HOST_DEVICE constexpr auto integer_divide_ceil(X x, Y y)
Definition tile/core/numeric/math.hpp:149
CK_TILE_DEVICE void move_tile_window(null_tile_window< WindowLengths > &, const typename null_tile_window< WindowLengths >::BottomTensorIndex &)
Definition null_tile_window.hpp:95
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition store_tile.hpp:23
CK_TILE_HOST_DEVICE constexpr auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition tile_distribution.hpp:480
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:17
static constexpr index_t kNPerBlock
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:45
number< 0 > I0
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:38
remove_cvref_t< std::tuple_element_t< 0, BsDataType > > BDataType
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:34
number< 1 > I1
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:39
remove_cvref_t< typename Problem::AsDataTypeTuple > AsDataType
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:18
static CK_TILE_HOST_DEVICE constexpr auto TransposeC()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:86
remove_cvref_t< std::tuple_element_t< 0, AsLayout > > ALayout
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:30
static constexpr bool Preshuffle
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:67
static constexpr bool kPadN
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:64
static constexpr index_t kKPerBlock
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:46
static constexpr index_t kMPerBlock
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:44
static constexpr index_t BlockSize
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:42
remove_cvref_t< typename Problem::AsLayoutTuple > AsLayout
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:26
static constexpr index_t kLdsAlignmentInBytes
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:71
static constexpr index_t GetSmemPackA()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:60
CK_TILE_DEVICE auto operator()(const AsDramBlockWindowTmp &a_dram_block_window_tmp, const BsDramBlockWindowTmp &b_dram_block_window_tmp, index_t num_loop, void *p_smem) const
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:320
remove_cvref_t< typename Problem::CDataType > CDataType
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:20
static CK_TILE_HOST_DEVICE constexpr index_t GetSmemSize()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:88
remove_cvref_t< std::tuple_element_t< 0, BsLayout > > BLayout
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:31
static constexpr index_t GetVectorSizeC()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:58
static constexpr index_t GetSmemPackB()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:61
CK_TILE_DEVICE auto operator()(const ADramBlockWindowTmp &a_dram_block_window_tmp, const BDramBlockWindowTmp &b_dram_block_window_tmp, index_t num_loop, void *p_smem) const
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:339
number< 2 > I2
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:40
static constexpr index_t GetVectorSizeA()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:49
remove_cvref_t< std::tuple_element_t< 0, AsDataType > > ADataType
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:33
CK_TILE_HOST_DEVICE auto operator()(const AsDramBlockWindowTmp &a_dram_block_window_tmp, const AElementFunction &a_element_func, const BsDramBlockWindowTmp &b_dram_block_window_tmp, const BElementFunction &b_element_func, index_t num_loop, void *p_smem) const
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:100
remove_cvref_t< typename Problem::BsLayoutTuple > BsLayout
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:27
static constexpr index_t NumWaveGroups
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:69
remove_cvref_t< typename Problem::CLayout > CLayout
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:28
static constexpr index_t GetVectorSizeB()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:54
remove_cvref_t< typename Problem::BElementWise > BElementWise
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:23
static constexpr bool DoubleSmemBuffer
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:84
remove_cvref_t< decltype(Policy::template GetBlockGemm< Problem >())> BlockGemm
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:36
remove_cvref_t< typename Problem::BlockGemmShape > BlockGemmShape
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:24
static CK_TILE_HOST const std::string GetName()
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:73
static constexpr bool kPadK
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:65
static constexpr bool kPadM
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:63
remove_cvref_t< typename Problem::BsDataTypeTuple > BsDataType
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:19
remove_cvref_t< typename Problem::AElementWise > AElementWise
Definition gemm_pipeline_agmem_bgmem_creg_v1.hpp:22