clang 22.0.0git
amdgpuintrin.h File Reference

Go to the source code of this file.

Macros

#define __gpu_private   __attribute__((address_space(5)))
#define __gpu_constant   __attribute__((address_space(4)))
#define __gpu_local   __attribute__((address_space(3)))
#define __gpu_global   __attribute__((address_space(1)))
#define __gpu_generic   __attribute__((address_space(0)))
#define __gpu_kernel   __attribute__((amdgpu_kernel, visibility("protected")))

Functions

 _Pragma ("omp begin declare target device_type(nohost)")
 _Pragma ("omp begin declare variant match(device = {arch(amdgcn)})")
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_x (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_y (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_z (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_x (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_y (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_z (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_x (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_y (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_z (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_x (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_y (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_z (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_lanes (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_lane_id (void)
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_lane_mask (void)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_read_first_lane_u32 (uint64_t __lane_mask, uint32_t __x)
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_ballot (uint64_t __lane_mask, bool __x)
static _DEFAULT_FN_ATTRS __inline__ void __gpu_sync_threads (void)
static _DEFAULT_FN_ATTRS __inline__ void __gpu_sync_lane (uint64_t __lane_mask)
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_shuffle_idx_u32 (uint64_t __lane_mask, uint32_t __idx, uint32_t __x, uint32_t __width)
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_any_u32 (uint64_t __lane_mask, uint32_t __x)
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_any_u64 (uint64_t __lane_mask, uint64_t __x)
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_all_u32 (uint64_t __lane_mask, uint32_t __x)
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_all_u64 (uint64_t __lane_mask, uint64_t __x)
static _DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_local (void *ptr)
static _DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_private (void *ptr)
static _DEFAULT_FN_ATTRS __inline__ void __gpu_exit (void)
static _DEFAULT_FN_ATTRS __inline__ void __gpu_thread_suspend (void)
 _Pragma ("omp end declare variant")
 _Pragma ("omp end declare target")

Macro Definition Documentation

◆ __gpu_constant

#define __gpu_constant   __attribute__((address_space(4)))

Definition at line 25 of file amdgpuintrin.h.

◆ __gpu_generic

#define __gpu_generic   __attribute__((address_space(0)))

Definition at line 28 of file amdgpuintrin.h.

◆ __gpu_global

#define __gpu_global   __attribute__((address_space(1)))

Definition at line 27 of file amdgpuintrin.h.

◆ __gpu_kernel

#define __gpu_kernel   __attribute__((amdgpu_kernel, visibility("protected")))

Definition at line 31 of file amdgpuintrin.h.

◆ __gpu_local

#define __gpu_local   __attribute__((address_space(3)))

Definition at line 26 of file amdgpuintrin.h.

◆ __gpu_private

#define __gpu_private   __attribute__((address_space(5)))

Definition at line 24 of file amdgpuintrin.h.

Function Documentation

◆ __gpu_ballot()

_DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_ballot ( uint64_t __lane_mask,
bool __x )
static

◆ __gpu_block_id_x()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_x ( void )
static

Definition at line 49 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_block_id().

◆ __gpu_block_id_y()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_y ( void )
static

Definition at line 54 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_block_id().

◆ __gpu_block_id_z()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_z ( void )
static

Definition at line 59 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_block_id().

◆ __gpu_exit()

_DEFAULT_FN_ATTRS __inline__ void __gpu_exit ( void )
static

Definition at line 179 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS and noreturn.

◆ __gpu_is_ptr_local()

_DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_local ( void * ptr )
static

Definition at line 167 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS and clang::opencl_generic.

◆ __gpu_is_ptr_private()

_DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_private ( void * ptr )
static

Definition at line 173 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS and clang::opencl_generic.

◆ __gpu_lane_id()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_lane_id ( void )
static

Definition at line 100 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_is_first_in_lane() and __gpu_shuffle_idx_u32().

◆ __gpu_lane_mask()

_DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_lane_mask ( void )
static

◆ __gpu_match_all_u32()

_DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_all_u32 ( uint64_t __lane_mask,
uint32_t __x )
static

Definition at line 156 of file amdgpuintrin.h.

References __gpu_match_all_u32_impl().

◆ __gpu_match_all_u64()

_DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_all_u64 ( uint64_t __lane_mask,
uint64_t __x )
static

Definition at line 162 of file amdgpuintrin.h.

References __gpu_match_all_u64_impl().

◆ __gpu_match_any_u32()

_DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_any_u32 ( uint64_t __lane_mask,
uint32_t __x )
static

Definition at line 144 of file amdgpuintrin.h.

References __gpu_match_any_u32_impl().

◆ __gpu_match_any_u64()

_DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_match_any_u64 ( uint64_t __lane_mask,
uint64_t __x )
static

Definition at line 150 of file amdgpuintrin.h.

References __gpu_match_any_u64_impl().

◆ __gpu_num_blocks_x()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_x ( void )
static

Definition at line 34 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_num_blocks().

◆ __gpu_num_blocks_y()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_y ( void )
static

Definition at line 39 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_num_blocks().

◆ __gpu_num_blocks_z()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_z ( void )
static

Definition at line 44 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_num_blocks().

◆ __gpu_num_lanes()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_lanes ( void )
static

Definition at line 95 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

◆ __gpu_num_threads_x()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_x ( void )
static

Definition at line 64 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_num_threads().

◆ __gpu_num_threads_y()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_y ( void )
static

Definition at line 69 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_num_threads().

◆ __gpu_num_threads_z()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_z ( void )
static

Definition at line 74 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_num_threads().

◆ __gpu_read_first_lane_u32()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_read_first_lane_u32 ( uint64_t __lane_mask,
uint32_t __x )
static

◆ __gpu_shuffle_idx_u32()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_shuffle_idx_u32 ( uint64_t __lane_mask,
uint32_t __idx,
uint32_t __x,
uint32_t __width )
static

Definition at line 136 of file amdgpuintrin.h.

References __gpu_lane_id().

Referenced by __gpu_shuffle_idx_f32() and __gpu_shuffle_idx_u64().

◆ __gpu_sync_lane()

_DEFAULT_FN_ATTRS __inline__ void __gpu_sync_lane ( uint64_t __lane_mask )
static

◆ __gpu_sync_threads()

_DEFAULT_FN_ATTRS __inline__ void __gpu_sync_threads ( void )
static

Definition at line 124 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

◆ __gpu_thread_id_x()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_x ( void )
static

Definition at line 79 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_thread_id().

◆ __gpu_thread_id_y()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_y ( void )
static

Definition at line 84 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_thread_id().

◆ __gpu_thread_id_z()

_DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_z ( void )
static

Definition at line 89 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

Referenced by __gpu_thread_id().

◆ __gpu_thread_suspend()

_DEFAULT_FN_ATTRS __inline__ void __gpu_thread_suspend ( void )
static

Definition at line 184 of file amdgpuintrin.h.

References _DEFAULT_FN_ATTRS.

◆ _Pragma() [1/4]

_Pragma ( "omp begin declare target device_type(nohost)" )

◆ _Pragma() [2/4]

_Pragma ( "omp begin declare variant match(device = {arch(amdgcn)})" )

◆ _Pragma() [3/4]

_Pragma ( "omp end declare target" )

◆ _Pragma() [4/4]

_Pragma ( "omp end declare variant" )