ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1< FloatA, FloatB, FloatC, AThreadDesc_TK0_TM0_TM1_TK1, BThreadDesc_TK0_TN0_TN1_TK1, CThreadDesc_TM0_TM1_TN0_TN1, TKLengths, TMLengths, TNLengths, type > Struct Template Reference

ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1< FloatA, FloatB, FloatC, AThreadDesc_TK0_TM0_TM1_TK1, BThreadDesc_TK0_TN0_TN1_TK1, CThreadDesc_TM0_TM1_TN0_TN1, TKLengths, TMLengths, TNLengths, type > Struct Template Reference

Composable Kernel: ck::ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1< FloatA, FloatB, FloatC, AThreadDesc_TK0_TM0_TM1_TK1, BThreadDesc_TK0_TN0_TN1_TK1, CThreadDesc_TM0_TM1_TN0_TN1, TKLengths, TMLengths, TNLengths, type > Struct Template Reference
ck::ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1< FloatA, FloatB, FloatC, AThreadDesc_TK0_TM0_TM1_TK1, BThreadDesc_TK0_TN0_TN1_TK1, CThreadDesc_TM0_TM1_TN0_TN1, TKLengths, TMLengths, TNLengths, type > Struct Template Reference

#include <threadwise_contraction_dl.hpp>

Public Member Functions

__device__ constexpr ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1 ()

Static Public Member Functions

template<typename ABuffer, typename AOriginIdx, typename BBuffer, typename BOriginIdx, typename CBuffer, typename COriginIdx>
static __device__ void Run (const ABuffer &a_buf, AOriginIdx, const BBuffer &b_buf, BOriginIdx, CBuffer &c_buf, COriginIdx)

Constructor & Destructor Documentation

◆ ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1()

template<typename FloatA, typename FloatB, typename FloatC, typename AThreadDesc_TK0_TM0_TM1_TK1, typename BThreadDesc_TK0_TN0_TN1_TK1, typename CThreadDesc_TM0_TM1_TN0_TN1, typename TKLengths, typename TMLengths, typename TNLengths, typename enable_if< AThreadDesc_TK0_TM0_TM1_TK1::IsKnownAtCompileTime() && BThreadDesc_TK0_TN0_TN1_TK1::IsKnownAtCompileTime() && CThreadDesc_TM0_TM1_TN0_TN1::IsKnownAtCompileTime(), bool >::type = false>
__device__ constexpr ck::ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1< FloatA, FloatB, FloatC, AThreadDesc_TK0_TM0_TM1_TK1, BThreadDesc_TK0_TN0_TN1_TK1, CThreadDesc_TM0_TM1_TN0_TN1, TKLengths, TMLengths, TNLengths, type >::ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1 ( )
inline constexpr

Member Function Documentation

◆ Run()

template<typename FloatA, typename FloatB, typename FloatC, typename AThreadDesc_TK0_TM0_TM1_TK1, typename BThreadDesc_TK0_TN0_TN1_TK1, typename CThreadDesc_TM0_TM1_TN0_TN1, typename TKLengths, typename TMLengths, typename TNLengths, typename enable_if< AThreadDesc_TK0_TM0_TM1_TK1::IsKnownAtCompileTime() && BThreadDesc_TK0_TN0_TN1_TK1::IsKnownAtCompileTime() && CThreadDesc_TM0_TM1_TN0_TN1::IsKnownAtCompileTime(), bool >::type = false>
template<typename ABuffer, typename AOriginIdx, typename BBuffer, typename BOriginIdx, typename CBuffer, typename COriginIdx>
__device__ void ck::ThreadwiseContractionDl_A_TK0_TM0_TM1_TK1_B_TK0_TN0_TN1_TK1_C_TM0_TM1_TN0_TN1< FloatA, FloatB, FloatC, AThreadDesc_TK0_TM0_TM1_TK1, BThreadDesc_TK0_TN0_TN1_TK1, CThreadDesc_TM0_TM1_TN0_TN1, TKLengths, TMLengths, TNLengths, type >::Run ( const ABuffer & a_buf,
AOriginIdx ,
const BBuffer & b_buf,
BOriginIdx ,
CBuffer & c_buf,
COriginIdx  )
inline static

The documentation for this struct was generated from the following file: