sweep_tile.hpp File Reference

sweep_tile.hpp File Reference

Composable Kernel: sweep_tile.hpp File Reference
sweep_tile.hpp File Reference

Go to the source code of this file.

Classes

struct ck_tile::impl::sweep_tile_impl< DistributedTensor, UnpacksPerXDim, sequence< I, Is... > >
struct ck_tile::impl::sweep_tile_impl< DistributedTensor, UnpacksPerXDim, sequence<> >
struct ck_tile::impl::sweep_tile_impl_0< DistributedTensor, UnpacksPerXDim, sequence< I, Is... > >
struct ck_tile::tile_sweeper< DistributedTensor_, F_, UnpacksPerXDim_ >

Namespaces

namespace ck_tile
namespace ck_tile::impl

Functions

template<typename TileDistributedSpan_, typename F>
CK_TILE_DEVICE void ck_tile::sweep_tile_span (TileDistributedSpan_, const F &f)
template<typename TileDistributedSpan_, typename F, typename Unpacks = typename uniform_sequence_gen<TileDistributedSpan_::Impl::size(), 1>::type>
CK_TILE_DEVICE void ck_tile::sweep_tile_uspan (TileDistributedSpan_, const F &f, Unpacks={})
template<typename DistributedTensor, typename F, typename UnpacksPerXDim = typename uniform_sequence_gen<DistributedTensor::get_num_of_dimension(), 1>::type>
CK_TILE_HOST_DEVICE constexpr void ck_tile::sweep_tile (const F &f, UnpacksPerXDim={})
template<typename DistributedTensor, typename F, typename UnpacksPerXDim = typename uniform_sequence_gen<DistributedTensor::get_num_of_dimension(), 1>::type>
CK_TILE_HOST_DEVICE constexpr void ck_tile::sweep_tile (const DistributedTensor &, const F &f, UnpacksPerXDim={})
template<typename T, typename F, typename U = typename uniform_sequence_gen<T::get_num_of_dimension(), 1>::type>
CK_TILE_HOST_DEVICE_EXTERN ck_tile::tile_sweeper (const T &, const F &, U={}) -> tile_sweeper< T, F, U >