elementwise_kernel.hpp Source File
elementwise_kernel.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
constexpr decltype(auto) apply(F &&f, Tuple &&t)
Definition tile/core/container/tuple.hpp:526
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_HOST_DEVICE constexpr auto make_naive_tensor_view(DataType *__restrict__ p, const tuple< Lengths... > &lengths, const tuple< Strides... > &strides, number< GuaranteedLastDimensionVectorLength >=number<-1 >{}, number< GuaranteedLastDimensionVectorStride >=number<-1 >{})
Definition tensor_view.hpp:471
CK_TILE_HOST_DEVICE constexpr auto make_merge_transform(const LowLengths &low_lengths)
Definition coordinate_transform.hpp:1615
typename __make_integer_seq< impl::__integer_sequence, index_t, N >::seq_type make_index_sequence
Definition tile/core/container/sequence.hpp:230
CK_TILE_HOST_DEVICE constexpr auto make_static_distributed_tensor(const StaticTileDistribution &)
Definition static_distributed_tensor.hpp:142
CK_TILE_DEVICE constexpr auto make_tile_window(null_tensor_view, const WindowLengths &window_lengths, const multi_index< WindowLengths::size()> &, Ts &&...)
Definition null_tile_window.hpp:75
CK_TILE_DEVICE auto cast_tile(const SrcTensor &src_tensor)
Definition tile_elementwise.hpp:327
CK_TILE_HOST_DEVICE constexpr auto generate_tuple(F &&f, number< N >)
Definition tile/core/container/tuple.hpp:429
CK_TILE_HOST_DEVICE constexpr auto pad_tensor_view(const TensorView &tensor_view, const TileLengths &tile_lengths, DoPads)
Definition tensor_view.hpp:530
CK_TILE_DEVICE void sweep_tile_span(TileDistributedSpan_, const F &f)
Definition sweep_tile.hpp:20
CK_TILE_DEVICE void store_tile(tile_window_with_static_lengths< BottomTensorView_, WindowLengths_ > &tile_window_tmp, const static_distributed_tensor< DataType_, TileDistribution_ > &dstr_tensor)
Definition store_tile.hpp:23
CK_TILE_HOST_DEVICE constexpr auto transform_tensor_view(const OldTensorView &old_tensor_view, const NewTransforms &new_transforms, NewLowerDimensionOldVisibleIdss, NewUpperDimensionNewVisibleIdss)
Definition tensor_view.hpp:511
CK_TILE_HOST_DEVICE constexpr Y type_convert(X x)
Definition tile/core/numeric/type_convert.hpp:29
CK_TILE_DEVICE auto load_tile(const TileWindow_ &tile_window, number< i_access >={}, bool_constant< oob_conditional_check >={})
Definition load_tile.hpp:22
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
Definition elementwise_kernel.hpp:14
ck_tile::remove_cvref_t< Problem_ > Problem
Definition elementwise_kernel.hpp:15
ck_tile::remove_cvref_t< typename Problem::XDataType > XDataType
Definition elementwise_kernel.hpp:18
ck_tile::remove_cvref_t< Policy_ > Policy
Definition elementwise_kernel.hpp:16
ck_tile::remove_cvref_t< typename Problem::ElementWiseOperation > ElementWiseOperation
Definition elementwise_kernel.hpp:21
CK_TILE_DEVICE void operator()(const Dims lens, const Dims input_strides, const Dims output_strides, const tuple< XDataType... > &input_tensors, YDataType *p_y) const
Definition elementwise_kernel.hpp:30
static constexpr index_t kBlockSize
Definition elementwise_kernel.hpp:23
static CK_TILE_HOST constexpr auto BlockSize()
Definition elementwise_kernel.hpp:24
static CK_TILE_HOST bool IsSupportedArgument(const ck_tile::tuple< Ints... > &input_sizes)
Definition elementwise_kernel.hpp:105
ck_tile::remove_cvref_t< typename Problem::YDataType > YDataType
Definition elementwise_kernel.hpp:20
ck_tile::remove_cvref_t< typename Problem::ComputeDataType > ComputeDataType
Definition elementwise_kernel.hpp:19
Definition tile/core/container/sequence.hpp:49
Definition tensor_view.hpp:41
Definition tile/core/container/tuple.hpp:192
CK_TILE_HOST_DEVICE constexpr decltype(auto) get() const &
Definition tile/core/container/tuple.hpp:269