clang 20.0.0git
Macros | Functions
nvptxintrin.h File Reference
#include <stdint.h>

Go to the source code of this file.

Macros

#define bool   _Bool
 
#define __gpu_private   __attribute__((address_space(5)))
 
#define __gpu_constant   __attribute__((address_space(4)))
 
#define __gpu_local   __attribute__((address_space(3)))
 
#define __gpu_global   __attribute__((address_space(1)))
 
#define __gpu_generic   __attribute__((address_space(0)))
 
#define __gpu_kernel   __attribute__((nvptx_kernel, visibility("protected")))
 

Functions

 _Pragma ("push_macro(\"bool\")")
 
 _Pragma ("omp begin declare target device_type(nohost)")
 
 _Pragma ("omp begin declare variant match(device = {arch(nvptx64)})")
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_x (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_y (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_z (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_x (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_y (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_z (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_x (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_y (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_z (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_x (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_y (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_z (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_lanes (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_lane_id (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_lane_mask (void)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_read_first_lane_u32 (uint64_t __lane_mask, uint32_t __x)
 
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_read_first_lane_u64 (uint64_t __lane_mask, uint64_t __x)
 
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_ballot (uint64_t __lane_mask, bool __x)
 
static _DEFAULT_FN_ATTRS __inline__ void __gpu_sync_threads (void)
 
static _DEFAULT_FN_ATTRS __inline__ void __gpu_sync_lane (uint64_t __lane_mask)
 
static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_shuffle_idx_u32 (uint64_t __lane_mask, uint32_t __idx, uint32_t __x)
 
static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_shuffle_idx_u64 (uint64_t __lane_mask, uint32_t __idx, uint64_t __x)
 
static _DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_local (void *ptr)
 
static _DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_private (void *ptr)
 
static _DEFAULT_FN_ATTRS __inline__ void __gpu_exit (void)
 
static _DEFAULT_FN_ATTRS __inline__ void __gpu_thread_suspend (void)
 
 _Pragma ("omp end declare variant")
 
 _Pragma ("omp end declare target")
 
 _Pragma ("pop_macro(\"bool\")")
 

Macro Definition Documentation

◆ __gpu_constant

#define __gpu_constant   __attribute__((address_space(4)))

Definition at line 28 of file nvptxintrin.h.

◆ __gpu_generic

#define __gpu_generic   __attribute__((address_space(0)))

Definition at line 31 of file nvptxintrin.h.

◆ __gpu_global

#define __gpu_global   __attribute__((address_space(1)))

Definition at line 30 of file nvptxintrin.h.

◆ __gpu_kernel

#define __gpu_kernel   __attribute__((nvptx_kernel, visibility("protected")))

Definition at line 34 of file nvptxintrin.h.

◆ __gpu_local

#define __gpu_local   __attribute__((address_space(3)))

Definition at line 29 of file nvptxintrin.h.

◆ __gpu_private

#define __gpu_private   __attribute__((address_space(5)))

Definition at line 27 of file nvptxintrin.h.

◆ bool

#define bool   _Bool

Definition at line 20 of file nvptxintrin.h.

Function Documentation

◆ __gpu_ballot()

static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_ballot (uint64_t __lane_mask, bool __x)
static

Definition at line 134 of file nvptxintrin.h.

◆ __gpu_block_id_x()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_x ( void  )
static

Definition at line 52 of file nvptxintrin.h.

◆ __gpu_block_id_y()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_y ( void  )
static

Definition at line 57 of file nvptxintrin.h.

◆ __gpu_block_id_z()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_block_id_z ( void  )
static

Definition at line 62 of file nvptxintrin.h.

◆ __gpu_exit()

static _DEFAULT_FN_ATTRS __inline__ void __gpu_exit ( void  )
static

Definition at line 184 of file nvptxintrin.h.

◆ __gpu_is_ptr_local()

static _DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_local ( void *  ptr)
static

Definition at line 174 of file nvptxintrin.h.

◆ __gpu_is_ptr_private()

static _DEFAULT_FN_ATTRS __inline__ bool __gpu_is_ptr_private ( void *  ptr)
static

Definition at line 179 of file nvptxintrin.h.

◆ __gpu_lane_id()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_lane_id ( void  )
static

Definition at line 102 of file nvptxintrin.h.

◆ __gpu_lane_mask()

static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_lane_mask ( void  )
static

Definition at line 107 of file nvptxintrin.h.

◆ __gpu_num_blocks_x()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_x ( void  )
static

Definition at line 37 of file nvptxintrin.h.

◆ __gpu_num_blocks_y()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_y ( void  )
static

Definition at line 42 of file nvptxintrin.h.

◆ __gpu_num_blocks_z()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_blocks_z ( void  )
static

Definition at line 47 of file nvptxintrin.h.

◆ __gpu_num_lanes()

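static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_lanes ( void  )
static

Definition at line 97 of file nvptxintrin.h.

Referenced by __gpu_read_first_lane_u32(), __gpu_read_first_lane_u64(), __gpu_shuffle_idx_u32(), and __gpu_shuffle_idx_u64().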

◆ __gpu_num_threads_x()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_x ( void  )
static

Definition at line 67 of file nvptxintrin.h.

◆ __gpu_num_threads_y()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_y ( void  )
static

Definition at line 72 of file nvptxintrin.h.

◆ __gpu_num_threads_z()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_num_threads_z ( void  )
static

Definition at line 77 of file nvptxintrin.h.

◆ __gpu_read_first_lane_u32()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_read_first_lane_u32 (uint64_t __lane_mask, uint32_t __x)
static

Definition at line 113 of file nvptxintrin.h.

References __gpu_num_lanes().

◆ __gpu_read_first_lane_u64()

static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_read_first_lane_u64 (uint64_t __lane_mask, uint64_t __x)
static

Definition at line 121 of file nvptxintrin.h.

References __gpu_num_lanes().

◆ __gpu_shuffle_idx_u32()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_shuffle_idx_u32 (uint64_t __lane_mask, uint32_t __idx, uint32_t __x)
static

Definition at line 152 of file nvptxintrin.h.

References __gpu_num_lanes().

◆ __gpu_shuffle_idx_u64()

static _DEFAULT_FN_ATTRS __inline__ uint64_t __gpu_shuffle_idx_u64 (uint64_t __lane_mask, uint32_t __idx, uint64_t __x)
static

Definition at line 161 of file nvptxintrin.h.

References __gpu_num_lanes().

◆ __gpu_sync_lane()

static _DEFAULT_FN_ATTRS __inline__ void __gpu_sync_lane ( uint64_t  __lane_mask)
static

Definition at line 146 of file nvptxintrin.h.

◆ __gpu_sync_threads()

static _DEFAULT_FN_ATTRS __inline__ void __gpu_sync_threads ( void  )
static

Definition at line 141 of file nvptxintrin.h.

◆ __gpu_thread_id_x()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_x ( void  )
static

Definition at line 82 of file nvptxintrin.h.

◆ __gpu_thread_id_y()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_y ( void  )
static

Definition at line 87 of file nvptxintrin.h.

◆ __gpu_thread_id_z()

static _DEFAULT_FN_ATTRS __inline__ uint32_t __gpu_thread_id_z ( void  )
static

Definition at line 92 of file nvptxintrin.h.

◆ __gpu_thread_suspend()

static _DEFAULT_FN_ATTRS __inline__ void __gpu_thread_suspend ( void  )
static

Definition at line 189 of file nvptxintrin.h.

◆ _Pragma() [1/6]

_Pragma ( "omp begin declare target device_type(nohost)"  )

◆ _Pragma() [2/6]

_Pragma ( "omp begin declare variant match(device = {arch(nvptx64)})"  )

◆ _Pragma() [3/6]

_Pragma ( "omp end declare target"  )

◆ _Pragma() [4/6]

_Pragma ( "omp end declare variant"  )

◆ _Pragma() [5/6]

_Pragma ( "pop_macro(\"bool\")"  )

◆ _Pragma() [6/6]

_Pragma ( "push_macro(\"bool\")"  )