gridwise_2d_reduction_threadwise.hpp File Reference

gridwise_2d_reduction_threadwise.hpp File Reference

Composable Kernel: gridwise_2d_reduction_threadwise.hpp File Reference
gridwise_2d_reduction_threadwise.hpp File Reference

Go to the source code of this file.

Classes

struct  ck::GridwiseReduction_mk_to_m_threadwise< InDataType, OutDataType, AccDataType, IndexDataType, InGridDesc_M_K, OutGridDesc_M, ReduceOperation, InElementwiseOperation, AccElementwiseOperation, OutMemoryDataOperation, PropagateNan, BlockSize, MThreadSliceSize, KThreadSliceSize, InSrcVectorDim, InSrcVectorSize, OutDstVectorSize >

Namespaces

namespace  ck

Functions

template<typename GridwiseReduction, bool OutputIndex, bool TransformIndexKtoGlobal, bool HaveIndexInput, typename InDataType, typename OutDataType, typename AccDataType, typename IndexDataType, typename InGridDesc_M_K, typename OutGridDesc_M, typename InElementwiseOperation, typename AccElementwiseOperation>
__global__ void ck::kernel_reduce_threadwise (const InGridDesc_M_K in_grid_desc_m_k, const OutGridDesc_M out_grid_desc_m, const InElementwiseOperation in_elementwise_op, const AccElementwiseOperation acc_elementwise_op, AccDataType alpha, const InDataType *const __restrict__ p_in_value_global, const IndexDataType *const __restrict__ p_in_index_global, AccDataType beta, OutDataType *const __restrict__ p_out_value_global, IndexDataType *const __restrict__ p_out_index_global)