xref: /freebsd-src/contrib/llvm-project/llvm/lib/Target/NVPTX/cl_common_defines.h (revision 0b57cec536236d46e3dba9bd041533462f33dbb7)
1*0b57cec5SDimitry Andric #ifndef CL_COMMON_DEFINES_H
2*0b57cec5SDimitry Andric #define CL_COMMON_DEFINES_H
3*0b57cec5SDimitry Andric // This file includes defines that are common to both kernel code and
4*0b57cec5SDimitry Andric // the NVPTX back-end.
5*0b57cec5SDimitry Andric 
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric // Common defines for Image intrinsics
8*0b57cec5SDimitry Andric // Channel order
9*0b57cec5SDimitry Andric enum {
10*0b57cec5SDimitry Andric   CLK_R = 0x10B0,
11*0b57cec5SDimitry Andric   CLK_A = 0x10B1,
12*0b57cec5SDimitry Andric   CLK_RG = 0x10B2,
13*0b57cec5SDimitry Andric   CLK_RA = 0x10B3,
14*0b57cec5SDimitry Andric   CLK_RGB = 0x10B4,
15*0b57cec5SDimitry Andric   CLK_RGBA = 0x10B5,
16*0b57cec5SDimitry Andric   CLK_BGRA = 0x10B6,
17*0b57cec5SDimitry Andric   CLK_ARGB = 0x10B7,
18*0b57cec5SDimitry Andric 
19*0b57cec5SDimitry Andric #if (__NV_CL_C_VERSION == __NV_CL_C_VERSION_1_0)
20*0b57cec5SDimitry Andric   CLK_xRGB = 0x10B7,
21*0b57cec5SDimitry Andric #endif
22*0b57cec5SDimitry Andric 
23*0b57cec5SDimitry Andric   CLK_INTENSITY = 0x10B8,
24*0b57cec5SDimitry Andric   CLK_LUMINANCE = 0x10B9
25*0b57cec5SDimitry Andric 
26*0b57cec5SDimitry Andric #if (__NV_CL_C_VERSION >= __NV_CL_C_VERSION_1_1)
27*0b57cec5SDimitry Andric       ,
28*0b57cec5SDimitry Andric   CLK_Rx = 0x10BA,
29*0b57cec5SDimitry Andric   CLK_RGx = 0x10BB,
30*0b57cec5SDimitry Andric   CLK_RGBx = 0x10BC
31*0b57cec5SDimitry Andric #endif
32*0b57cec5SDimitry Andric };
33*0b57cec5SDimitry Andric 
34*0b57cec5SDimitry Andric typedef enum clk_channel_type {
35*0b57cec5SDimitry Andric   // valid formats for float return types
36*0b57cec5SDimitry Andric   CLK_SNORM_INT8 = 0x10D0,  // four channel RGBA unorm8
37*0b57cec5SDimitry Andric   CLK_SNORM_INT16 = 0x10D1, // four channel RGBA unorm16
38*0b57cec5SDimitry Andric   CLK_UNORM_INT8 = 0x10D2,  // four channel RGBA unorm8
39*0b57cec5SDimitry Andric   CLK_UNORM_INT16 = 0x10D3, // four channel RGBA unorm16
40*0b57cec5SDimitry Andric   CLK_HALF_FLOAT = 0x10DD,  // four channel RGBA half
41*0b57cec5SDimitry Andric   CLK_FLOAT = 0x10DE,       // four channel RGBA float
42*0b57cec5SDimitry Andric 
43*0b57cec5SDimitry Andric #if (__NV_CL_C_VERSION >= __NV_CL_C_VERSION_1_1)
44*0b57cec5SDimitry Andric   CLK_UNORM_SHORT_565 = 0x10D4,
45*0b57cec5SDimitry Andric   CLK_UNORM_SHORT_555 = 0x10D5,
46*0b57cec5SDimitry Andric   CLK_UNORM_INT_101010 = 0x10D6,
47*0b57cec5SDimitry Andric #endif
48*0b57cec5SDimitry Andric 
49*0b57cec5SDimitry Andric   // valid only for integer return types
50*0b57cec5SDimitry Andric   CLK_SIGNED_INT8 = 0x10D7,
51*0b57cec5SDimitry Andric   CLK_SIGNED_INT16 = 0x10D8,
52*0b57cec5SDimitry Andric   CLK_SIGNED_INT32 = 0x10D9,
53*0b57cec5SDimitry Andric   CLK_UNSIGNED_INT8 = 0x10DA,
54*0b57cec5SDimitry Andric   CLK_UNSIGNED_INT16 = 0x10DB,
55*0b57cec5SDimitry Andric   CLK_UNSIGNED_INT32 = 0x10DC,
56*0b57cec5SDimitry Andric 
57*0b57cec5SDimitry Andric   // CI SPI for CPU
58*0b57cec5SDimitry Andric   __CLK_UNORM_INT8888,  // four channel ARGB unorm8
59*0b57cec5SDimitry Andric   __CLK_UNORM_INT8888R, // four channel BGRA unorm8
60*0b57cec5SDimitry Andric 
61*0b57cec5SDimitry Andric   __CLK_VALID_IMAGE_TYPE_COUNT,
62*0b57cec5SDimitry Andric   __CLK_INVALID_IMAGE_TYPE = __CLK_VALID_IMAGE_TYPE_COUNT,
63*0b57cec5SDimitry Andric   __CLK_VALID_IMAGE_TYPE_MASK_BITS = 4, // number of bits required to
64*0b57cec5SDimitry Andric                                         // represent any image type
65*0b57cec5SDimitry Andric   __CLK_VALID_IMAGE_TYPE_MASK = (1 << __CLK_VALID_IMAGE_TYPE_MASK_BITS) - 1
66*0b57cec5SDimitry Andric } clk_channel_type;
67*0b57cec5SDimitry Andric 
68*0b57cec5SDimitry Andric typedef enum clk_sampler_type {
69*0b57cec5SDimitry Andric   __CLK_ADDRESS_BASE = 0,
70*0b57cec5SDimitry Andric   CLK_ADDRESS_NONE = 0 << __CLK_ADDRESS_BASE,
71*0b57cec5SDimitry Andric   CLK_ADDRESS_CLAMP = 1 << __CLK_ADDRESS_BASE,
72*0b57cec5SDimitry Andric   CLK_ADDRESS_CLAMP_TO_EDGE = 2 << __CLK_ADDRESS_BASE,
73*0b57cec5SDimitry Andric   CLK_ADDRESS_REPEAT = 3 << __CLK_ADDRESS_BASE,
74*0b57cec5SDimitry Andric   CLK_ADDRESS_MIRROR = 4 << __CLK_ADDRESS_BASE,
75*0b57cec5SDimitry Andric 
76*0b57cec5SDimitry Andric #if (__NV_CL_C_VERSION >= __NV_CL_C_VERSION_1_1)
77*0b57cec5SDimitry Andric   CLK_ADDRESS_MIRRORED_REPEAT = CLK_ADDRESS_MIRROR,
78*0b57cec5SDimitry Andric #endif
79*0b57cec5SDimitry Andric   __CLK_ADDRESS_MASK =
80*0b57cec5SDimitry Andric       CLK_ADDRESS_NONE | CLK_ADDRESS_CLAMP | CLK_ADDRESS_CLAMP_TO_EDGE |
81*0b57cec5SDimitry Andric       CLK_ADDRESS_REPEAT | CLK_ADDRESS_MIRROR,
82*0b57cec5SDimitry Andric   __CLK_ADDRESS_BITS = 3, // number of bits required to
83*0b57cec5SDimitry Andric                           // represent address info
84*0b57cec5SDimitry Andric 
85*0b57cec5SDimitry Andric   __CLK_NORMALIZED_BASE = __CLK_ADDRESS_BITS,
86*0b57cec5SDimitry Andric   CLK_NORMALIZED_COORDS_FALSE = 0,
87*0b57cec5SDimitry Andric   CLK_NORMALIZED_COORDS_TRUE = 1 << __CLK_NORMALIZED_BASE,
88*0b57cec5SDimitry Andric   __CLK_NORMALIZED_MASK =
89*0b57cec5SDimitry Andric       CLK_NORMALIZED_COORDS_FALSE | CLK_NORMALIZED_COORDS_TRUE,
90*0b57cec5SDimitry Andric   __CLK_NORMALIZED_BITS = 1, // number of bits required to
91*0b57cec5SDimitry Andric                              // represent normalization
92*0b57cec5SDimitry Andric 
93*0b57cec5SDimitry Andric   __CLK_FILTER_BASE = __CLK_NORMALIZED_BASE + __CLK_NORMALIZED_BITS,
94*0b57cec5SDimitry Andric   CLK_FILTER_NEAREST = 0 << __CLK_FILTER_BASE,
95*0b57cec5SDimitry Andric   CLK_FILTER_LINEAR = 1 << __CLK_FILTER_BASE,
96*0b57cec5SDimitry Andric   CLK_FILTER_ANISOTROPIC = 2 << __CLK_FILTER_BASE,
97*0b57cec5SDimitry Andric   __CLK_FILTER_MASK =
98*0b57cec5SDimitry Andric       CLK_FILTER_NEAREST | CLK_FILTER_LINEAR | CLK_FILTER_ANISOTROPIC,
99*0b57cec5SDimitry Andric   __CLK_FILTER_BITS = 2, // number of bits required to
100*0b57cec5SDimitry Andric                          // represent address info
101*0b57cec5SDimitry Andric 
102*0b57cec5SDimitry Andric   __CLK_MIP_BASE = __CLK_FILTER_BASE + __CLK_FILTER_BITS,
103*0b57cec5SDimitry Andric   CLK_MIP_NEAREST = 0 << __CLK_MIP_BASE,
104*0b57cec5SDimitry Andric   CLK_MIP_LINEAR = 1 << __CLK_MIP_BASE,
105*0b57cec5SDimitry Andric   CLK_MIP_ANISOTROPIC = 2 << __CLK_MIP_BASE,
106*0b57cec5SDimitry Andric   __CLK_MIP_MASK = CLK_MIP_NEAREST | CLK_MIP_LINEAR | CLK_MIP_ANISOTROPIC,
107*0b57cec5SDimitry Andric   __CLK_MIP_BITS = 2,
108*0b57cec5SDimitry Andric 
109*0b57cec5SDimitry Andric   __CLK_SAMPLER_BITS = __CLK_MIP_BASE + __CLK_MIP_BITS,
110*0b57cec5SDimitry Andric   __CLK_SAMPLER_MASK = __CLK_MIP_MASK | __CLK_FILTER_MASK |
111*0b57cec5SDimitry Andric                        __CLK_NORMALIZED_MASK | __CLK_ADDRESS_MASK,
112*0b57cec5SDimitry Andric 
113*0b57cec5SDimitry Andric   __CLK_ANISOTROPIC_RATIO_BITS = 5,
114*0b57cec5SDimitry Andric   __CLK_ANISOTROPIC_RATIO_MASK =
115*0b57cec5SDimitry Andric       (int) 0x80000000 >> (__CLK_ANISOTROPIC_RATIO_BITS - 1)
116*0b57cec5SDimitry Andric } clk_sampler_type;
117*0b57cec5SDimitry Andric 
118*0b57cec5SDimitry Andric // Memory synchronization
119*0b57cec5SDimitry Andric #define CLK_LOCAL_MEM_FENCE (1 << 0)
120*0b57cec5SDimitry Andric #define CLK_GLOBAL_MEM_FENCE (1 << 1)
121*0b57cec5SDimitry Andric 
122*0b57cec5SDimitry Andric #endif // CL_COMMON_DEFINES_H
123