LogitsSoftCap< UseExp2 > Struct Template Reference

LogitsSoftCap< UseExp2 > Struct Template Reference

Composable Kernel: ck_tile::LogitsSoftCap< UseExp2 > Struct Template Reference
ck_tile::LogitsSoftCap< UseExp2 > Struct Template Reference

#include <variants.hpp>

Public Member Functions

__device__ __host__ LogitsSoftCap ()=default
template<typename Params, typename T>
__device__ __forceinline__ T QueryTransform (const Params &params, T q) const
template<typename Params, typename T>
__device__ __forceinline__ T LogitsTransform (const Params &params, T logits, uint32_t batch_idx, uint32_t qo_head_idx, uint32_t kv_head_idx) const
template<typename Params>
__device__ __forceinline__ bool LogitsMask (const Params &params, uint32_t batch_idx, uint32_t qo_idx, uint32_t kv_idx, uint32_t qo_head_idx, uint32_t kv_head_idx) const

Constructor & Destructor Documentation

◆ LogitsSoftCap()

template<bool UseExp2 = false>
__device__ __host__ ck_tile::LogitsSoftCap< UseExp2 >::LogitsSoftCap ( )
default

Member Function Documentation

◆ LogitsMask()

template<bool UseExp2 = false>
template<typename Params>
__device__ __forceinline__ bool ck_tile::LogitsSoftCap< UseExp2 >::LogitsMask ( const Params & params,
uint32_t batch_idx,
uint32_t qo_idx,
uint32_t kv_idx,
uint32_t qo_head_idx,
uint32_t kv_head_idx ) const
inline

◆ LogitsTransform()

template<bool UseExp2 = false>
template<typename Params, typename T>
__device__ __forceinline__ T ck_tile::LogitsSoftCap< UseExp2 >::LogitsTransform ( const Params & params,
T logits,
uint32_t batch_idx,
uint32_t qo_head_idx,
uint32_t kv_head_idx ) const
inline

NOTICE: For better performance, we simply transform the thread buffer without calculating qo_idx/kv_idx.

◆ QueryTransform()

template<bool UseExp2 = false>
template<typename Params, typename T>
__device__ __forceinline__ T ck_tile::LogitsSoftCap< UseExp2 >::QueryTransform ( const Params & params,
T q ) const
inline

The documentation for this struct was generated from the following file: