Member List

Member List

Composable Kernel: Member List
ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > Member List

This is the complete list of members for ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >, including all inherited members.

BlockwiseReduce typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
BlockwiseWelford typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
I0 ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > static
I1 ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > static
K_BlockTileSize ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > static
M_BlockTileSize ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > static
PassThroughOp typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
reorder_thread_cluster ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > static
Run(const XYGridDesc_M_K &x_grid_desc_m_k, const XYGridDesc_M_K &dy_grid_desc_m_k, const MeanVarGridDesc_M &mean_var_grid_desc_m, const MeanVarCountGridDesc_M_K &mean_var_count_grid_desc_m_k, const DscaleDbiasGridDesc_M_G &dscale_dbias_grid_desc_m_g, index_t blkgroup_size, index_t num_xy_k_block_tile_iteration, index_t num_mean_var_count_k_block_tile_iteration, AccDataType epsilon, bool haveSavedMeanInvVar, const MeanVarDataType *const __restrict__ p_savedMean, const MeanVarDataType *const __restrict__ p_savedInvVar, const MeanVarDataType *const __restrict__ p_in_welford_mean, const MeanVarDataType *const __restrict__ p_in_welford_variance, const int32_t *const __restrict__ p_in_welford_count, const DyElementwiseOp dy_elementwise_op, MeanVarDataType *const __restrict__ p_out_welford_mean, MeanVarDataType *const __restrict__ p_out_welford_inv_variance, const XDataType *const __restrict__ p_x, const DyDataType *const __restrict__ p_dy, DscaleDbiasDataType *const __restrict__ p_reduce_dscale, DscaleDbiasDataType *const __restrict__ p_reduce_dbias) ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > inline static
thread_cluster_desc ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize > static
ThreadBufferDimAccessOrder typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadClusterArrangeOrder typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadClusterLengths_M_K typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadReduceDstDesc_M typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadReduceSrcDesc_M_1 typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadReduceSrcDesc_M_K typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadwiseReduce typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >
ThreadwiseWelford typedef ck::GridwiseWelfordSecondHalfReduceFirstHalf< XDataType, DyDataType, AccDataType, ScaleDataType, DscaleDbiasDataType, MeanVarDataType, DyElementwiseOp, XYGridDesc_M_K, MeanVarGridDesc_M, MeanVarCountGridDesc_M_K, DscaleDbiasGridDesc_M_G, BlockSize, MThreadClusterSize, KThreadClusterSize, MThreadSliceSize, KThreadSliceSize, XDyVectorDim, XSrcVectorSize, DySrcVectorSize, MeanVarSrcVectorSize >