generic_permute_kernel.hpp Source File
generic_permute_kernel.hpp
Go to the documentation of this file.
Definition tile/core/algorithm/cluster_descriptor.hpp:13
remove_cv_t< std::remove_reference_t< T > > remove_cvref_t
Definition type_traits.hpp:21
CK_TILE_HOST_DEVICE constexpr auto make_naive_tensor_view(DataType *__restrict__ p, const tuple< Lengths... > &lengths, const tuple< Strides... > &strides, number< GuaranteedLastDimensionVectorLength >=number<-1 >{}, number< GuaranteedLastDimensionVectorStride >=number<-1 >{})
Definition tensor_view.hpp:471
CK_TILE_HOST_DEVICE constexpr auto make_merge_transform(const LowLengths &low_lengths)
Definition coordinate_transform.hpp:1615
CK_TILE_HOST_DEVICE constexpr auto generate_tuple(F &&f, number< N >)
Definition tile/core/container/tuple.hpp:429
CK_TILE_HOST_DEVICE constexpr auto transform_tensor_view(const OldTensorView &old_tensor_view, const NewTransforms &new_transforms, NewLowerDimensionOldVisibleIdss, NewUpperDimensionNewVisibleIdss)
Definition tensor_view.hpp:511
CK_TILE_HOST_DEVICE constexpr auto make_tensor_coordinate(const TensorDesc &tensor_desc, const TopIndex &idx_top)
Definition tensor_coordinate.hpp:60
CK_TILE_HOST_DEVICE constexpr auto make_tuple(Xs &&... xs)
Definition tile/core/container/tuple.hpp:360
CK_TILE_HOST_DEVICE constexpr auto make_naive_tensor_view_packed(DataType *__restrict__ p, const tuple< Lengths... > &lengths, number< GuaranteedLastDimensionVectorLength >=number<-1 >{})
Definition tensor_view.hpp:494
Definition generic_permute_kernel.hpp:49
index_t perm_stride[kMaxRanks]
Definition generic_permute_kernel.hpp:55
index_t perm_length[kMaxRanks]
Definition generic_permute_kernel.hpp:54
index_t num_elements
Definition generic_permute_kernel.hpp:53
Definition generic_permute_kernel.hpp:15
index_t perm[kMaxRanks]
Definition generic_permute_kernel.hpp:22
index_t shape[kMaxRanks]
Definition generic_permute_kernel.hpp:21
static constexpr index_t kMaxRanks
Definition generic_permute_kernel.hpp:16
Definition generic_permute_kernel.hpp:40
static constexpr index_t kBlockSize
Definition generic_permute_kernel.hpp:44
static constexpr index_t kMaxRanks
Definition generic_permute_kernel.hpp:45
static CK_TILE_HOST constexpr Kargs MakeKargs(const GenericPermuteHostArgs &h)
Definition generic_permute_kernel.hpp:68
remove_cvref_t< typename Problem::DataType > DataType
Definition generic_permute_kernel.hpp:43
static CK_TILE_HOST constexpr index_t TotalElements(const GenericPermuteHostArgs &h)
Definition generic_permute_kernel.hpp:58
static constexpr bool KeepLastDim
Definition generic_permute_kernel.hpp:46
static CK_TILE_HOST constexpr auto GridSize(GenericPermuteHostArgs h)
Definition generic_permute_kernel.hpp:110
CK_TILE_DEVICE void operator()(Kargs kargs) const
Definition generic_permute_kernel.hpp:120
ck_tile::remove_cvref_t< Problem_ > Problem
Definition generic_permute_kernel.hpp:41
static CK_TILE_HOST_DEVICE constexpr auto BlockSize()
Definition generic_permute_kernel.hpp:118
typename std::conditional< kHasContent, type0, type1 >::type type
Definition tile/core/container/sequence.hpp:302
A fixed-size array container similar to std::array with additional utilities.
Definition tile/core/container/array.hpp:43
Definition tile/core/container/sequence.hpp:49
Definition tile/core/utility/debug.hpp:67