add_rmsnorm2d_rdquant_fwd_kernel.hpp Source File
add_rmsnorm2d_rdquant_fwd_kernel.hpp
Go to the documentation of this file.
Line 130: _TS_(S_::Block_M) + "x" + _TS_(S_::Block_N) + "_" + _TS_(S_::WarpPerBlock_M) + "x" + _TS_(S_::WarpPerBlock_N) + "_" +
#define _TS_
#define _SS_
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_HOST_DEVICE constexpr auto make_naive_tensor_view(DataType *__restrict__ p, const tuple< Lengths... > &lengths, const tuple< Strides... > &strides, number< GuaranteedLastDimensionVectorLength >=number<-1 >{}, number< GuaranteedLastDimensionVectorStride >=number<-1 >{})
Definition tensor_view.hpp:471
CK_TILE_DEVICE constexpr auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition null_tile_window.hpp:75
CK_TILE_HOST_DEVICE constexpr auto integer_divide_ceil(X x, Y y)
Definition tile/core/numeric/math.hpp:149
CK_TILE_HOST_DEVICE constexpr auto pad_tensor_view(const TensorView &tensor_view, const TileLengths &tile_lengths, DoPads)
Definition tensor_view.hpp:530
CK_TILE_DEVICE constexpr auto make_null_tile_window(const WindowLengths &window_lengths)
Definition null_tile_window.hpp:66
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:62
void * p_qy
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:69
index_t n
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:74
const void * p_b
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:64
void * p_yscale
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:68
const void * p_a
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:63
index_t stride
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:75
float epsilon
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:71
index_t m
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:73
const void * p_gamma
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:65
void * p_x
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:67
static constexpr const char * name
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:108
static constexpr const char * name
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:110
static constexpr const char * name
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:107
static constexpr const char * name
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:109
static constexpr const char * name
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:106
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:105
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:14
float epsilon
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:23
const void * p_a
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:15
void * p_x
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:19
const void * p_b
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:16
const void * p_gamma
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:17
index_t stride
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:27
void * p_yscale
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:20
void * p_qy
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:21
index_t m
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:25
index_t n
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:26
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:33
remove_cvref_t< typename Problem::ComputeDataType > ComputeDataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:40
static constexpr bool kPadN
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:50
static constexpr bool kThreePass
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:51
static constexpr bool kSaveX
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:45
static constexpr index_t Vector_N
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:54
remove_cvref_t< typename Problem::BDataType > BDataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:38
static constexpr index_t Block_M
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:47
CK_TILE_DEVICE void operator()(Kargs kargs) const
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:138
static CK_TILE_HOST std::string GetName()
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:116
static constexpr index_t Block_N
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:48
static constexpr auto I1
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:59
remove_cvref_t< typename Problem::ADataType > ADataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:37
static constexpr index_t kBlockSize
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:56
remove_cvref_t< Pipeline_ > Pipeline
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:34
static constexpr bool kPadM
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:49
typename Pipeline::Problem Problem
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:35
static CK_TILE_HOST constexpr Kargs MakeKargs(const Hargs &hargs)
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:79
static constexpr index_t Repeat_N
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:55
static CK_TILE_HOST constexpr auto BlockSize()
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:98
static CK_TILE_HOST constexpr auto GridSize(const Hargs &hargs)
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:93
static constexpr index_t ThreadPerWarp_N
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:53
static constexpr auto I0
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:58
AddRmsnorm2dRdquantFwdHostArgs Hargs
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:77
remove_cvref_t< typename Problem::YScaleDataType > YScaleDataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:42
remove_cvref_t< typename Problem::GammaDataType > GammaDataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:39
remove_cvref_t< typename Problem::QYDataType > QYDataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:43
remove_cvref_t< typename Problem::XDataType > XDataType
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:41
static CK_TILE_HOST_DEVICE constexpr index_t GetSmemSize()
Definition add_rmsnorm2d_rdquant_fwd_kernel.hpp:114
Definition tile/core/container/sequence.hpp:49