block_fmha_fwd_v3_pipeline.hpp File Reference

block_fmha_fwd_v3_pipeline.hpp File Reference

Composable Kernel: block_fmha_fwd_v3_pipeline.hpp File Reference
block_fmha_fwd_v3_pipeline.hpp File Reference

Go to the source code of this file.

Classes

struct ck_tile::CoreLoopScheduler< PipelineProblem, true >
struct ck_tile::CoreLoopScheduler< PipelineProblem, false >
struct ck_tile::BlockFmhaFwdV3Pipeline< Problem_, Policy_ >

Namespaces

namespace  ck_tile
namespace  ck_tile::detail

Macros

#define ENABLE_ASM_MARKER   1
#define ASM_MARKER(marker)
#define ADD_SBARRIER_FOR_PHASE0   1
#define CK_TILE_DISABLE_PACKED_FP32   0
#define WARP_ID   0
#define LANE_ID   0
#define ENABLE_DEBUG_STMTS   1
#define DEBUG_STMTS   if constexpr(false)

Functions

CK_TILE_DEVICE float ck_tile::detail::fma_impl_vsv (float a, float b, float c)
CK_TILE_DEVICE float ck_tile::detail::add_impl_vv (float lhs, float rhs)
CK_TILE_DEVICE float ck_tile::detail::mul_impl_vv (float lhs, float rhs)
CK_TILE_DEVICE fp16x2_t ck_tile::detail::cvt_pk_fp16_f32 (float a, float b)
CK_TILE_DEVICE bf16x2_t ck_tile::detail::cvt_pk_bf16_f32 (float a, float b)
CK_TILE_DEVICE fp32x2_t ck_tile::detail::pk_mul_f32 (fp32x2_t lhs, fp32x2_t rhs)

Macro Definition Documentation

◆ ADD_SBARRIER_FOR_PHASE0

#define ADD_SBARRIER_FOR_PHASE0   1

◆ ASM_MARKER

#define ASM_MARKER(marker)

◆ CK_TILE_DISABLE_PACKED_FP32

#define CK_TILE_DISABLE_PACKED_FP32   0

◆ DEBUG_STMTS

#define DEBUG_STMTS   if constexpr(false)

◆ ENABLE_ASM_MARKER

#define ENABLE_ASM_MARKER   1

◆ ENABLE_DEBUG_STMTS

#define ENABLE_DEBUG_STMTS   1

◆ LANE_ID

#define LANE_ID   0

◆ WARP_ID

#define WARP_ID   0