#include <dpp_gemm.hpp>
|
| __host__ __device__ constexpr | DppGemm () |
| template<class ADataType, class BDataType, class CDataType> |
| __device__ void | Run (const ADataType &p_a_wave, const BDataType &p_b_wave, CDataType &p_c_thread) const |
|
| static constexpr auto | I0 = Number<0>{} |
| static constexpr auto | I1 = Number<1>{} |
| static constexpr auto | I2 = Number<2>{} |
| static constexpr auto | I3 = Number<3>{} |
| static constexpr auto | I4 = Number<4>{} |
| static constexpr auto | I5 = Number<5>{} |
| static constexpr auto | dpp = DppSelector<BaseType, MPerDpp, NPerDpp>{} |
| static constexpr auto | dpp_instr = dpp.selected_dpp |
| static constexpr auto | K0PerDpp = 1 |
| static constexpr auto | K1PerDpp = dpp.GetK1PerDpp() |
◆ CIndex
◆ CIndex4D
◆ DppGemm()
| __host__ __device__ constexpr ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::DppGemm |
( |
| ) |
|
|
inline constexpr |
◆ CalculateAThreadOriginDataIndex_K_M()
| __host__ static __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::CalculateAThreadOriginDataIndex_K_M |
( |
| ) |
|
|
inline static |
◆ CalculateBThreadOriginDataIndex_K_N()
| __host__ static __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::CalculateBThreadOriginDataIndex_K_N |
( |
| ) |
|
|
inline static |
◆ GetBeginOfThreadBlk()
| __device__ CIndex ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetBeginOfThreadBlk |
( |
| ) |
|
|
inline static |
◆ GetCMNThreadBlkLengths()
| __host__ static __device__ constexpr auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetCMNThreadBlkLengths |
( |
| ) |
|
|
inline static constexpr |
◆ GetDppOpIdx()
| __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetDppOpIdx |
( |
| ) |
|
|
inline static |
◆ GetLaneGroupIdInWave()
| __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetLaneGroupIdInWave |
( |
| ) |
|
|
inline static |
◆ GetLaneIdInLaneGroup()
| __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetLaneIdInLaneGroup |
( |
| ) |
|
|
inline static |
◆ GetLaneIdInWave()
| __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetLaneIdInWave |
( |
| ) |
|
|
inline static |
◆ GetRegSizePerDpp()
| __device__ constexpr index_t ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetRegSizePerDpp |
( |
| ) |
|
|
inline static constexpr |
◆ GetWaveId()
| __device__ auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::GetWaveId |
( |
| ) |
|
|
inline static |
◆ Run()
template<class ADataType, class BDataType, class CDataType>
| __device__ void ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::Run |
( |
const ADataType & | p_a_wave, |
|
|
const BDataType & | p_b_wave, |
|
|
CDataType & | p_c_thread ) const |
|
inline |
◆ dpp
◆ dpp_instr
| auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::dpp_instr = dpp.selected_dpp |
|
static constexpr |
◆ I0
◆ I1
◆ I2
◆ I3
◆ I4
◆ I5
◆ K0PerDpp
| auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::K0PerDpp = 1 |
|
static constexpr |
◆ K1PerDpp
| auto ck::DppGemm< BaseType, MPerDpp, NPerDpp, KPack >::K1PerDpp = dpp.GetK1PerDpp() |
|
static constexpr |
The documentation for this struct was generated from the following file: