arch.hpp Source File
arch.hpp
Go to the documentation of this file.
96 CK_TILE_DEVICE index_t get_thread_global_1d_id() { return blockIdx.x * blockDim.x + threadIdx.x; }
Definition arch.hpp:385
Definition tile/core/algorithm/cluster_descriptor.hpp:13
typename safe_underlying_type< T, std::is_enum< T >::value >::type safe_underlying_type_t
Definition arch.hpp:43
CK_TILE_DEVICE void atomic_add(X *p_dst, const X &x)
__device__ uint32_t amd_wave_read_first_lane(uint16_t v)
Definition tile/core/arch/amd_buffer_addressing.hpp:35
constant< b > bool_constant
Definition tile/core/numeric/integral_constant.hpp:43
CK_TILE_DEVICE index_t get_warp_id(bool_constant< ReturnSgpr >={})
Definition arch.hpp:104
CK_TILE_DEVICE void block_sync_lds_direct_load()
Definition arch.hpp:288
CK_TILE_HOST_DEVICE T add(const T &a, const T &b)
Definition tile/core/arch/generic_memory_space_atomic.hpp:16
CK_TILE_HOST_DEVICE constexpr index_t get_smem_capacity()
Definition arch.hpp:328
CK_TILE_DEVICE index_t get_thread_local_1d_id()
Definition arch.hpp:94
__device__ T * cast_pointer_to_generic_address_space(T CK_CONSTANT_ADDRESS_SPACE *p)
Definition arch.hpp:307
CK_TILE_DEVICE index_t get_thread_global_1d_id()
Definition arch.hpp:96
__host__ __device__ T CK_CONSTANT_ADDRESS_SPACE * cast_pointer_to_constant_address_space(T *p)
Definition arch.hpp:318
CK_TILE_DEVICE void block_sync_load_raw(index_t cnt=0)
Definition arch.hpp:121
CK_TILE_HOST_DEVICE constexpr const char * address_space_to_string(address_space_enum addr_space)
Helper function to convert address space enum to string.
Definition arch.hpp:338
Definition arch.hpp:151
static CK_TILE_DEVICE constexpr index_t pack_lgkm(index_t c)
Definition arch.hpp:157
static CK_TILE_DEVICE constexpr index_t LGKM_MASK
Definition arch.hpp:153
static CK_TILE_DEVICE constexpr index_t pack_exp(index_t)
Definition arch.hpp:158
static CK_TILE_DEVICE constexpr index_t VM_MASK
Definition arch.hpp:152
static CK_TILE_DEVICE constexpr bool HAS_EXP
Definition arch.hpp:154
static CK_TILE_DEVICE constexpr index_t pack_vm(index_t c)
Definition arch.hpp:156
Definition arch.hpp:140
static CK_TILE_DEVICE constexpr index_t VM_MASK
Definition arch.hpp:141
static CK_TILE_DEVICE constexpr index_t pack_vm(index_t c)
Definition arch.hpp:145
static CK_TILE_DEVICE constexpr index_t pack_lgkm(index_t c)
Definition arch.hpp:146
static CK_TILE_DEVICE constexpr index_t pack_exp(index_t)
Definition arch.hpp:147
static CK_TILE_DEVICE constexpr index_t LGKM_MASK
Definition arch.hpp:142
static CK_TILE_DEVICE constexpr bool HAS_EXP
Definition arch.hpp:143
Definition arch.hpp:162
static CK_TILE_DEVICE constexpr bool HAS_EXP
Definition arch.hpp:166
static CK_TILE_DEVICE constexpr index_t pack_lgkm(index_t c)
Definition arch.hpp:173
static CK_TILE_DEVICE constexpr index_t pack_vm(index_t c)
Definition arch.hpp:168
static CK_TILE_DEVICE constexpr index_t EXP_MASK
Definition arch.hpp:165
static CK_TILE_DEVICE constexpr index_t LGKM_MASK
Definition arch.hpp:164
static CK_TILE_DEVICE constexpr index_t VM_MASK
Definition arch.hpp:163
static CK_TILE_DEVICE constexpr index_t pack_exp(index_t c)
Definition arch.hpp:174
Definition tile/core/numeric/integral_constant.hpp:13
Definition arch.hpp:360
Definition arch.hpp:363
Definition arch.hpp:366
Definition arch.hpp:357
Definition arch.hpp:354
Definition arch.hpp:369
std::underlying_type_t< T > type
Definition arch.hpp:33
Definition arch.hpp:28
Definition arch.hpp:190
static CK_TILE_DEVICE constexpr index_t from_lgkmcnt()
Definition arch.hpp:210
static CK_TILE_DEVICE constexpr index_t kMaxVmCnt
Definition arch.hpp:197
static CK_TILE_DEVICE constexpr index_t from_vmcnt()
Definition arch.hpp:203
static CK_TILE_DEVICE constexpr index_t from_expcnt()
Definition arch.hpp:217
static CK_TILE_DEVICE constexpr index_t kMaxExpCnt
Definition arch.hpp:199
static CK_TILE_DEVICE constexpr index_t kMaxLgkmCnt
Definition arch.hpp:198