/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-composable-kernel/checkouts/develop/include/ck_tile/core/tensor/static_distributed_tensor.hpp Source File
static_distributed_tensor.hpp
Go to the documentation of this file.
Line 142: CK_TILE_HOST_DEVICE constexpr auto make_static_distributed_tensor(const StaticTileDistribution&)
Line 149: CK_TILE_HOST_DEVICE constexpr auto make_static_distributed_tensor(const StaticTileDistribution&, ... (overload; remaining parameters are truncated in this listing)
constexpr bool is_similiar_distributed_tensor_v
Definition: static_distributed_tensor.hpp:230
CK_TILE_HOST_DEVICE auto get_partition_index(Distribution)
Definition: tile_distribution.hpp:22
Definition: cluster_descriptor.hpp:13
constexpr CK_TILE_HOST_DEVICE auto to_array(const std::vector< X > &x)
Definition: array.hpp:286
constexpr CK_TILE_HOST_DEVICE auto make_tensor_adaptor_coordinate(const Adaptor &adaptor, const TopIndex &idx_top)
Definition: tensor_adaptor_coordinate.hpp:55
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition: type_traits.hpp:21
constexpr CK_TILE_HOST_DEVICE index_t reduce_on_sequence(Seq, Reduce f, number< Init >)
Definition: sequence.hpp:979
constexpr CK_TILE_HOST_DEVICE auto make_static_distributed_tensor(const StaticTileDistribution &)
Definition: static_distributed_tensor.hpp:142
constexpr CK_TILE_HOST_DEVICE auto make_naive_tensor_descriptor_packed(const tuple< Lengths... > &lengths, number< GuaranteedLastDimensionVectorLength >=number<-1 >{})
Definition: tensor_descriptor.hpp:365
CK_TILE_DEVICE void sweep_tile_span(TileDistributedSpan_, const F &f)
Definition: sweep_tile.hpp:20
CK_TILE_HOST_DEVICE void set_tile_if(static_distributed_tensor< DataType, StaticTileDistribution > &out_tensor, DataType value, XIndicesPredicate predicate)
Definition: static_distributed_tensor.hpp:175
constexpr CK_TILE_HOST_DEVICE auto make_tuple(Xs &&... xs)
Definition: tuple.hpp:360
constexpr CK_TILE_HOST_DEVICE auto get_y_unpacks_from_x_unpacks(YLengths, number< XUnpacks >)
Definition: static_distributed_tensor.hpp:197
constexpr CK_TILE_HOST_DEVICE auto get_x_indices_from_distributed_indices(StaticTileDistribution tile_distribution, DistributedIndices distributed_indices)
Definition: static_distributed_tensor.hpp:159
constexpr auto slice_sequence(Seq, number< SliceSize >, Mask=typename uniform_sequence_gen< Seq::size(), 1 >::type{})
Definition: sequence.hpp:1246
impl::is_static_impl< remove_cvref_t< T > > is_static
Definition: type_traits.hpp:87
constexpr CK_TILE_HOST_DEVICE auto container_concat(const X &x, const Ys &... ys)
Definition: container_helper.hpp:363
Definition: integral_constant.hpp:13
Definition: static_distributed_tensor.hpp:215
static constexpr bool value
Definition: static_distributed_tensor.hpp:216
Definition: math.hpp:98
Definition: numeric.hpp:81
Definition: sequence.hpp:49
Definition: static_distributed_tensor.hpp:21
static constexpr index_t kThreadElementSpaceSize
Definition: static_distributed_tensor.hpp:33
constexpr CK_TILE_HOST_DEVICE DataType & operator()(TileDistributedIndices)
Definition: static_distributed_tensor.hpp:126
remove_cvref_t< StaticTileDistribution_ > StaticTileDistribution
Definition: static_distributed_tensor.hpp:23
CK_TILE_HOST_DEVICE void set_y_sliced_thread_data(sequence< YSliceOrigins... >, sequence< YSliceLengths... >, const SlicedThreadData &sliced_thread_data)
Definition: static_distributed_tensor.hpp:93
CK_TILE_HOST_DEVICE auto get_y_sliced_thread_data(sequence< YSliceOrigins... >, sequence< YSliceLengths... >) const
Definition: static_distributed_tensor.hpp:68
thread_buffer< DataType, get_thread_buffer_size()> thread_buf_
Definition: static_distributed_tensor.hpp:138
static constexpr CK_TILE_HOST_DEVICE auto get_lengths()
Definition: static_distributed_tensor.hpp:41
remove_cvref_t< DataType_ > DataType
Definition: static_distributed_tensor.hpp:22
static constexpr CK_TILE_HOST_DEVICE auto get_tile_distribution()
Definition: static_distributed_tensor.hpp:46
static constexpr CK_TILE_HOST_DEVICE auto get_distributed_spans()
Definition: static_distributed_tensor.hpp:51
static constexpr index_t PackedSize
Definition: static_distributed_tensor.hpp:30
static constexpr CK_TILE_HOST_DEVICE auto get_num_of_dimension()
Definition: static_distributed_tensor.hpp:36
constexpr CK_TILE_HOST_DEVICE auto & get_thread_buffer()
Definition: static_distributed_tensor.hpp:60
static constexpr CK_TILE_HOST_DEVICE index_t get_thread_buffer_size()
Definition: static_distributed_tensor.hpp:62
remove_cvref_t< decltype(StaticTileDistribution{}.get_ys_to_d_descriptor())> ThreadTensorDesc
Definition: static_distributed_tensor.hpp:29
constexpr CK_TILE_HOST_DEVICE const DataType & operator[](TileDistributedIndices) const
Definition: static_distributed_tensor.hpp:114
constexpr CK_TILE_HOST_DEVICE const auto & get_thread_buffer() const
Definition: static_distributed_tensor.hpp:58
CK_TILE_HOST_DEVICE void initialize(const DataType &x)
Definition: static_distributed_tensor.hpp:56
Definition: functional.hpp:141
Definition: debug.hpp:67
Definition: tile_distribution.hpp:72
constexpr CK_TILE_HOST_DEVICE const auto & get_ps_ys_to_xs_adaptor() const
Definition: tile_distribution.hpp:126
static constexpr CK_TILE_HOST_DEVICE auto get_y_indices_from_distributed_indices(DistributedIndices)
Definition: tile_distribution.hpp:205