#include <block_fmha_bwd_dq_dk_dv_pipeline_kr_ktr_vr_iglp.hpp>
|
template<typename QDramBlockWindowTmp, typename KDramBlockWindowTmp, typename VDramBlockWindowTmp, typename BiasDramBlockWindowTmp, typename RandValDramBlockWindowTmp, typename OGradDramBlockWindowTmp, typename LSEDramBlockWindowTmp, typename DDramBlockWindowTmp, typename QGradDramBlockWindowTmp, typename BiasGradDramBlockWindowTmp, typename PositionEncoding>
CK_TILE_HOST_DEVICE auto operator() (void *smem_ptr, const QDramBlockWindowTmp &q_dram_block_window_tmp, const KDramBlockWindowTmp &k_dram_block_window_tmp, const VDramBlockWindowTmp &v_dram_block_window_tmp, const BiasDramBlockWindowTmp &bias_dram_block_window_tmp, const RandValDramBlockWindowTmp &randval_dram_block_window_tmp, const OGradDramBlockWindowTmp &do_dram_block_window_tmp, const LSEDramBlockWindowTmp &lse_dram_block_window_tmp, const DDramBlockWindowTmp &d_dram_block_window_tmp, const QGradDramBlockWindowTmp &dq_dram_block_window_tmp, const BiasGradDramBlockWindowTmp &dbias_dram_block_window_tmp, FmhaMask mask, PositionEncoding position_encoding, float raw_scale, float scale, float rp_undrop, float scale_rp_undrop, FmhaDropout &dropout) const
◆ AccDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ BiasDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ BiasGradDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ BlockFmhaShape
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ DDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ FmhaDropout
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ FmhaMask
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ GemmDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ HotLoopScheduler
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ KDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ KGradDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ LSEDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ ODataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ OGradDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ QDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ QGradDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ RandValOutputDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ VDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ VGradDataType
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ GetSmemSize()
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ operator()()
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
template<typename QDramBlockWindowTmp, typename KDramBlockWindowTmp, typename VDramBlockWindowTmp, typename BiasDramBlockWindowTmp, typename RandValDramBlockWindowTmp, typename OGradDramBlockWindowTmp, typename LSEDramBlockWindowTmp, typename DDramBlockWindowTmp, typename QGradDramBlockWindowTmp, typename BiasGradDramBlockWindowTmp, typename PositionEncoding>
CK_TILE_HOST_DEVICE auto ck_tile::BlockFmhaBwdDQDKDVPipelineKRKTRVRIGLP< Problem, Policy >::operator() (
    void * smem_ptr,
    const QDramBlockWindowTmp & q_dram_block_window_tmp,
    const KDramBlockWindowTmp & k_dram_block_window_tmp,
    const VDramBlockWindowTmp & v_dram_block_window_tmp,
    const BiasDramBlockWindowTmp & bias_dram_block_window_tmp,
    const RandValDramBlockWindowTmp & randval_dram_block_window_tmp,
    const OGradDramBlockWindowTmp & do_dram_block_window_tmp,
    const LSEDramBlockWindowTmp & lse_dram_block_window_tmp,
    const DDramBlockWindowTmp & d_dram_block_window_tmp,
    const QGradDramBlockWindowTmp & dq_dram_block_window_tmp,
    const BiasGradDramBlockWindowTmp & dbias_dram_block_window_tmp,
    FmhaMask mask,
    PositionEncoding position_encoding,
    float raw_scale,
    float scale,
    float rp_undrop,
    float scale_rp_undrop,
    FmhaDropout & dropout ) const
inline
◆ BiasEnum
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kAlignmentBias
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kAlignmentK
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
Initial value:=
static constexpr index_t kPadHeadDimQ
Definition block_fmha_bwd_dq_dk_dv_pipeline_kr_ktr_vr.hpp:52
◆ kAlignmentKGrad
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kAlignmentOGrad
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
Initial value:=
static constexpr bool kPadHeadDimV
Definition block_fmha_bwd_dot_do_o.hpp:24
◆ kAlignmentQ
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kAlignmentQGrad
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kAlignmentV
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
Initial value:=
static constexpr index_t kPadHeadDimV
Definition block_fmha_bwd_dq_dk_dv_pipeline_kr_ktr_vr.hpp:53
◆ kAlignmentVGrad
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kBlockPerCu
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kBlockSize
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kHasBiasGrad
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kIsDeterministic
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kIsGroupMode
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kK0
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kK1
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kK2
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kK3
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kK4
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kM0
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kN0
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kPadHeadDimQ
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kPadHeadDimV
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kQKHeaddim
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kUseTrLoad
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ kVHeaddim
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
◆ name
template<typename Problem, typename Policy = BlockFmhaBwdPipelineDefaultPolicy>
The documentation for this struct was generated from the following file: