dynamic_quant_epilogue.hpp Source File
dynamic_quant_epilogue.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_DEVICE auto tile_elementwise_in(const InElementFunc &in_element_func, const InTensor &... in_dstr_tensors)
Definition tile_elementwise.hpp:40
CK_TILE_HOST_DEVICE constexpr void sweep_tile(const F &f, UnpacksPerXDim={})
Definition sweep_tile.hpp:231
CK_TILE_DEVICE constexpr auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition null_tile_window.hpp:75
CK_TILE_DEVICE auto cast_tile(const SrcTensor &src_tensor)
Definition tile_elementwise.hpp:327
CK_TILE_DEVICE void buffer_store_fence(index_t cnt=0)
Definition tile/core/arch/amd_buffer_addressing.hpp:1063
CK_TILE_DEVICE void store_tile_raw(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition store_tile.hpp:46
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition store_tile.hpp:23
CK_TILE_HOST_DEVICE constexpr auto make_static_tile_distribution(StaticTileDistributionEncoding_)
Definition tile_distribution.hpp:480
CK_TILE_HOST_DEVICE constexpr Y type_convert(X x)
Definition tile/core/numeric/type_convert.hpp:29
CK_TILE_DEVICE auto load_tile(const TileWindow_ &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition load_tile.hpp:22
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
Definition block_reduce2d.hpp:334
Definition block_reduce2d.hpp:46
Definition block_reduce2d_problem.hpp:15
Definition block_reduce2d.hpp:224
Definition dynamic_quant_epilogue.hpp:45
static constexpr bool UseMax3
Definition dynamic_quant_epilogue.hpp:55
remove_cvref_t< typename Problem::BlockShape > BlockShape
Definition dynamic_quant_epilogue.hpp:51
remove_cvref_t< typename Problem::YScaleDataType > YScaleDataType
Definition dynamic_quant_epilogue.hpp:49
remove_cvref_t< typename Problem::ODataType > ODataType
Definition dynamic_quant_epilogue.hpp:50
static constexpr bool kPadM
Definition dynamic_quant_epilogue.hpp:52
remove_cvref_t< typename Problem::SmoothScaleDataType > SmoothScaleDataType
Definition dynamic_quant_epilogue.hpp:48
static CK_TILE_HOST_DEVICE constexpr auto GetBlockReduce2dCrossWarpSync()
Definition dynamic_quant_epilogue.hpp:69
static CK_TILE_HOST_DEVICE constexpr auto GetBlockReduce2dSync()
Definition dynamic_quant_epilogue.hpp:63
CK_TILE_DEVICE auto operator()(ODramWindowTmp &o_dram_window_tmp, YScaleWindow &y_scale_window, const OAccTile &o_acc_tile, void *smem)
Definition dynamic_quant_epilogue.hpp:204
remove_cvref_t< typename Problem::AccDataType > AccDataType
Definition dynamic_quant_epilogue.hpp:47
static constexpr bool kPadN
Definition dynamic_quant_epilogue.hpp:53
static constexpr bool UseRawStore
Definition dynamic_quant_epilogue.hpp:54
CK_TILE_DEVICE auto operator()(ODramWindowTmp &o_dram_window_tmp, const SmoothScaleWindow &sm_scale_window_, YScaleWindow &y_scale_window, const OAccTile &o_acc_tile, void *smem)
Definition dynamic_quant_epilogue.hpp:180
static CK_TILE_HOST_DEVICE constexpr auto GetBlockReduce2d()
Definition dynamic_quant_epilogue.hpp:57
remove_cvref_t< Problem > Problem
Definition dynamic_quant_epilogue.hpp:46
static CK_TILE_DEVICE constexpr auto MakeSmoothInputScaleTileDistribution()
Definition dynamic_quant_epilogue.hpp:75
static CK_TILE_HOST_DEVICE constexpr index_t GetSmemSize()
Definition dynamic_quant_epilogue.hpp:102
CK_TILE_DEVICE auto Impl(ODramWindowTmp &o_dram_window_tmp, YScaleWindow &y_scale_window, const OAccTile &o_acc_tile, void *smem)
Definition dynamic_quant_epilogue.hpp:109
Definition dynamic_quant_epilogue.hpp:33
remove_cvref_t< YScaleDataType_ > YScaleDataType
Definition dynamic_quant_epilogue.hpp:36
remove_cvref_t< ODataType_ > ODataType
Definition dynamic_quant_epilogue.hpp:37
remove_cvref_t< Traits_ > Traits
Definition dynamic_quant_epilogue.hpp:39
remove_cvref_t< BlockShape_ > BlockShape
Definition dynamic_quant_epilogue.hpp:38
remove_cvref_t< SmoothScaleDataType_ > SmoothScaleDataType
Definition dynamic_quant_epilogue.hpp:35
remove_cvref_t< AccDataType_ > AccDataType
Definition dynamic_quant_epilogue.hpp:34
Definition dynamic_quant_epilogue.hpp:17
static constexpr bool kPadM
Definition dynamic_quant_epilogue.hpp:18
static constexpr bool UseRawStore
Definition dynamic_quant_epilogue.hpp:21
static constexpr bool kPadN
Definition dynamic_quant_epilogue.hpp:19
static constexpr bool UseSmoothInputScale
Definition dynamic_quant_epilogue.hpp:20
static constexpr bool UseMax3
Definition dynamic_quant_epilogue.hpp:22
static CK_TILE_HOST_DEVICE constexpr T max()
Definition tile/core/numeric/numeric.hpp:26
Definition tile/core/container/sequence.hpp:49
Definition tile_distribution_encoding.hpp:26
Definition tile/core/container/tuple.hpp:192