xref: /freebsd/contrib/llvm-project/clang/lib/Sema/OpenCLBuiltins.td (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
1//==--- OpenCLBuiltins.td - OpenCL builtin declarations -------------------===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
6// See https://llvm.org/LICENSE.txt for license information.
7// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
8//
9//===----------------------------------------------------------------------===//
10//
11// This file contains TableGen definitions for OpenCL builtin function
12// declarations.  In case of an unresolved function name in OpenCL, Clang will
13// check for a function described in this file when -fdeclare-opencl-builtins
14// is specified.
15//
16//===----------------------------------------------------------------------===//
17
18//===----------------------------------------------------------------------===//
19//              Definitions of miscellaneous basic entities.
20//===----------------------------------------------------------------------===//
// OpenCL language versions.  Each record stores its version as an integer
// code in ID; the CLAll record uses the code 0.
class Version<int _Version> {
  int ID = _Version;
}

def CLAll : Version<0>;
def CL10 : Version<100>;
def CL11 : Version<110>;
def CL12 : Version<120>;
def CL20 : Version<200>;
30
// Address spaces.
// Every pointer type has to be given one of these; Name holds the
// address-space expression as a string.
class AddressSpace<string _AS> {
  string Name = _AS;
}

def DefaultAS : AddressSpace<"clang::LangAS::Default">;
def PrivateAS : AddressSpace<"clang::LangAS::opencl_private">;
def GlobalAS : AddressSpace<"clang::LangAS::opencl_global">;
def ConstantAS : AddressSpace<"clang::LangAS::opencl_constant">;
def LocalAS : AddressSpace<"clang::LangAS::opencl_local">;
def GenericAS : AddressSpace<"clang::LangAS::opencl_generic">;
42
// Common base for OpenCL language extension records.
class AbstractExtension<string _Ext> {
  // Space-separated list of one or more OpenCL extensions.  Every entry has
  // to be a name that the opencl extension pragma accepts.
  string ExtName = _Ext;
}
49
// Extension(s) attached to a builtin function.
class FunctionExtension<string _Ext> : AbstractExtension<_Ext> {}
52
// Extension(s) attached to a type.  Builtin overloads that mention a type
// carrying a TypeExtension are conditionalized implicitly: overload
// resolution skips such an overload while the extension is disabled.
class TypeExtension<string _Ext> : AbstractExtension<_Ext> {}
59
// Append zero or more space-separated extensions (NewExts) to Base; the
// combined FunctionExtension is made available in the ret field.
//   - NewExts empty      -> ret carries Base's extension string unchanged.
//   - Base's name empty  -> ret carries NewExts alone.
//   - otherwise          -> ret carries "<Base> <NewExts>".
class concatExtension<FunctionExtension Base, string NewExts> {
  FunctionExtension ret = FunctionExtension<
    !if(!empty(NewExts),
        Base.ExtName,
        !if(!empty(Base.ExtName),
            NewExts,
            Base.ExtName # " " # NewExts))
  >;
}
76
// Available TypeExtension records.  NoTypeExt (empty name) is the default
// used by the Type class.
def NoTypeExt : TypeExtension<"">;
def Fp16TypeExt : TypeExtension<"cl_khr_fp16">;
def Fp64TypeExt : TypeExtension<"cl_khr_fp64">;
def Atomic64TypeExt
    : TypeExtension<"cl_khr_int64_base_atomics cl_khr_int64_extended_atomics">;
def AtomicFp64TypeExt
    : TypeExtension<"cl_khr_int64_base_atomics cl_khr_int64_extended_atomics cl_khr_fp64">;
83
// Available FunctionExtension records.

// No extension required.
def FuncExtNone : FunctionExtension<"">;

// Subgroup related extensions.
def FuncExtKhrSubgroups : FunctionExtension<"__opencl_subgroup_builtins">;
def FuncExtKhrSubgroupExtendedTypes : FunctionExtension<"cl_khr_subgroup_extended_types">;
def FuncExtKhrSubgroupNonUniformVote : FunctionExtension<"cl_khr_subgroup_non_uniform_vote">;
def FuncExtKhrSubgroupBallot : FunctionExtension<"cl_khr_subgroup_ballot">;
def FuncExtKhrSubgroupNonUniformArithmetic : FunctionExtension<"cl_khr_subgroup_non_uniform_arithmetic">;
def FuncExtKhrSubgroupShuffle : FunctionExtension<"cl_khr_subgroup_shuffle">;
def FuncExtKhrSubgroupShuffleRelative : FunctionExtension<"cl_khr_subgroup_shuffle_relative">;
def FuncExtKhrSubgroupClusteredReduce : FunctionExtension<"cl_khr_subgroup_clustered_reduce">;

// Extended bit operations.
def FuncExtKhrExtendedBitOps : FunctionExtension<"cl_khr_extended_bit_ops">;

// Integer atomics extensions.
def FuncExtKhrGlobalInt32BaseAtomics : FunctionExtension<"cl_khr_global_int32_base_atomics">;
def FuncExtKhrGlobalInt32ExtendedAtomics : FunctionExtension<"cl_khr_global_int32_extended_atomics">;
def FuncExtKhrLocalInt32BaseAtomics : FunctionExtension<"cl_khr_local_int32_base_atomics">;
def FuncExtKhrLocalInt32ExtendedAtomics : FunctionExtension<"cl_khr_local_int32_extended_atomics">;
def FuncExtKhrInt64BaseAtomics : FunctionExtension<"cl_khr_int64_base_atomics">;
def FuncExtKhrInt64ExtendedAtomics : FunctionExtension<"cl_khr_int64_extended_atomics">;

// Image related extensions.
def FuncExtKhrMipmapImage : FunctionExtension<"cl_khr_mipmap_image">;
def FuncExtKhrMipmapImageWrites : FunctionExtension<"cl_khr_mipmap_image_writes">;
def FuncExtKhrGlMsaaSharing : FunctionExtension<"cl_khr_gl_msaa_sharing">;

// "__opencl_c_*" names.
def FuncExtOpenCLCDeviceEnqueue : FunctionExtension<"__opencl_c_device_enqueue">;
def FuncExtOpenCLCGenericAddressSpace : FunctionExtension<"__opencl_c_generic_address_space">;
def FuncExtOpenCLCNamedAddressSpaceBuiltins : FunctionExtension<"__opencl_c_named_address_space_builtins">;
def FuncExtOpenCLCPipes : FunctionExtension<"__opencl_c_pipes">;
def FuncExtOpenCLCWGCollectiveFunctions : FunctionExtension<"__opencl_c_work_group_collective_functions">;
def FuncExtOpenCLCReadWriteImages : FunctionExtension<"__opencl_c_read_write_images">;

// cl_ext_float_atomics: fp16 load/store per address space.
def FuncExtFloatAtomicsFp16GlobalASLoadStore
    : FunctionExtension<"cl_ext_float_atomics __opencl_c_ext_fp16_global_atomic_load_store">;
def FuncExtFloatAtomicsFp16LocalASLoadStore
    : FunctionExtension<"cl_ext_float_atomics __opencl_c_ext_fp16_local_atomic_load_store">;
def FuncExtFloatAtomicsFp16GenericASLoadStore
    : FunctionExtension<"cl_ext_float_atomics __opencl_c_ext_fp16_global_atomic_load_store __opencl_c_ext_fp16_local_atomic_load_store">;

// cl_ext_float_atomics: add and min/max for fp16, fp32 and fp64.  The loops
// below define the records
//   FuncExtFloatAtomicsFp{16,32,64}{Global,Local,Generic}AS{Add,MinMax}
// where the GenericAS variants list the local name followed by the global one.
foreach FP = ["16", "32", "64"] in {
  foreach Op = ["add", "min_max"] in {
    defvar Suffix = !if(!eq(Op, "add"), "Add", "MinMax");
    def "FuncExtFloatAtomicsFp" # FP # "GlobalAS" # Suffix
        : FunctionExtension<"cl_ext_float_atomics __opencl_c_ext_fp" # FP #
                            "_global_atomic_" # Op>;
    def "FuncExtFloatAtomicsFp" # FP # "LocalAS" # Suffix
        : FunctionExtension<"cl_ext_float_atomics __opencl_c_ext_fp" # FP #
                            "_local_atomic_" # Op>;
    def "FuncExtFloatAtomicsFp" # FP # "GenericAS" # Suffix
        : FunctionExtension<"cl_ext_float_atomics __opencl_c_ext_fp" # FP #
                            "_local_atomic_" # Op #
                            " __opencl_c_ext_fp" # FP #
                            "_global_atomic_" # Op>;
  }
}
132
// Pseudo-extension (not a real one): a workaround used to add builtins that
// are specific to C++ for OpenCL.
def FuncExtOpenCLCxx : FunctionExtension<"__cplusplus">;
135
// Arm integer dot product extensions.
def ArmIntegerDotProductInt8
    : FunctionExtension<"cl_arm_integer_dot_product_int8">;
def ArmIntegerDotProductAccumulateInt8
    : FunctionExtension<"cl_arm_integer_dot_product_accumulate_int8">;
def ArmIntegerDotProductAccumulateInt16
    : FunctionExtension<"cl_arm_integer_dot_product_accumulate_int16">;
def ArmIntegerDotProductAccumulateSaturateInt8
    : FunctionExtension<"cl_arm_integer_dot_product_accumulate_saturate_int8">;
141
// Qualified type; corresponds to ASTContext::QualType.
class QualType<string _TypeExpr, bit _IsAbstract=0> {
  // Expression used inside OCL2Qual to obtain the QualType, for instance
  // TypeExpr="Context.IntTy" for int.
  string TypeExpr = _TypeExpr;
  // Set for QualTypes that stand for an abstract type without a matching AST
  // QualType, such as a GenType or an `image2d_t` type that lacks an access
  // qualifier.
  bit IsAbstract = _IsAbstract;
}
152
// A named list of integers.
class IntList<string _Name, list<int> _List> {
  string Name = _Name;
  list<int> List = _List;
}
158
159//===----------------------------------------------------------------------===//
160//                      OpenCL C classes for types
161//===----------------------------------------------------------------------===//
// Base record for the OpenCL C data types (int, float, image2d_t, ...).
// Derived classes describe either concrete types (e.g. VectorType) or
// abstract types (e.g. GenType).
class Type<string _Name, QualType _QTExpr> {
  // Type name.
  string Name = _Name;
  // The QualType record that belongs to this type.
  QualType QTExpr = _QTExpr;
  // Vector size, where applicable; defaults to 1.
  int VecWidth = 1;
  // Whether the type is a pointer.
  bit IsPointer = 0;
  // Whether the type is "const" qualified.
  bit IsConst = 0;
  // Whether the type is "volatile" qualified.
  bit IsVolatile = 0;
  // Access qualifier; has to be one of ("RO", "WO", "RW").  Empty by default.
  string AccessQualifier = "";
  // Address space; defaults to the name held by DefaultAS.
  string AddrSpace = DefaultAS.Name;
  // Extension that has to be enabled before a builtin using this type is
  // exposed.
  TypeExtension Extension = NoTypeExt;
}
185
// Vector form of an existing type (e.g. int2, int3, int16, float8, ...).
class VectorType<Type _Ty, int _VecWidth> : Type<_Ty.Name, _Ty.QTExpr> {
  // Copied from the element type.
  let IsPointer = _Ty.IsPointer;
  let IsConst = _Ty.IsConst;
  let IsVolatile = _Ty.IsVolatile;
  let AddrSpace = _Ty.AddrSpace;
  let Extension = _Ty.Extension;
  // Vector specific: the requested width, and an empty access qualifier.
  let VecWidth = _VecWidth;
  let AccessQualifier = "";
}
197
// Pointer to an existing type (e.g. int*, float*, ...), placed in address
// space _AS (DefaultAS unless specified).
class PointerType<Type _Ty, AddressSpace _AS = DefaultAS>
    : Type<_Ty.Name, _Ty.QTExpr> {
  // Copied from the pointee type.
  let VecWidth = _Ty.VecWidth;
  let IsConst = _Ty.IsConst;
  let IsVolatile = _Ty.IsVolatile;
  let AccessQualifier = _Ty.AccessQualifier;
  let Extension = _Ty.Extension;
  // Pointer specific: mark as pointer and record the address space name.
  let IsPointer = 1;
  let AddrSpace = _AS.Name;
}
210
// "const" qualified form of an existing type (e.g. const int).
class ConstType<Type _Ty> : Type<_Ty.Name, _Ty.QTExpr> {
  // Copied from the wrapped type.
  let VecWidth = _Ty.VecWidth;
  let IsPointer = _Ty.IsPointer;
  let IsVolatile = _Ty.IsVolatile;
  let AccessQualifier = _Ty.AccessQualifier;
  let AddrSpace = _Ty.AddrSpace;
  let Extension = _Ty.Extension;
  // The one field this wrapper changes.
  let IsConst = 1;
}
222
// "volatile" qualified form of an existing type (e.g. volatile int).
class VolatileType<Type _Ty> : Type<_Ty.Name, _Ty.QTExpr> {
  // Copied from the wrapped type.
  let VecWidth = _Ty.VecWidth;
  let IsPointer = _Ty.IsPointer;
  let IsConst = _Ty.IsConst;
  let AccessQualifier = _Ty.AccessQualifier;
  let AddrSpace = _Ty.AddrSpace;
  let Extension = _Ty.Extension;
  // The one field this wrapper changes.
  let IsVolatile = 1;
}
234
// Image type with an access qualifier (e.g. image2d).  The QualType
// expression is the base image's expression followed by the access qualifier
// and "Ty"; the resulting QualType is not abstract.
class ImageType<Type _Ty, string _AccessQualifier>
    : Type<_Ty.Name,
           QualType<_Ty.QTExpr.TypeExpr # _AccessQualifier # "Ty", 0>> {
  // Predicates used to select the TypeExtension below.
  defvar Is3d = !eq(_Ty.Name, "image3d_t");
  defvar IsDepth = !or(!eq(_Ty.Name, "image2d_depth_t"),
                       !eq(_Ty.Name, "image2d_array_depth_t"));
  defvar IsWriteOnly = !eq(_AccessQualifier, "WO");
  defvar IsReadWrite = !eq(_AccessQualifier, "RW");

  let VecWidth = 0;
  let AccessQualifier = _AccessQualifier;

  // Copied from the base image type.
  let IsPointer = _Ty.IsPointer;
  let IsConst = _Ty.IsConst;
  let IsVolatile = _Ty.IsVolatile;
  let AddrSpace = _Ty.AddrSpace;

  // Writable "image3d_t" types and "read_write" image types get their own
  // TypeExtension, as do the 2D depth image types.  The first matching
  // condition wins; all remaining cases keep the base type's extension.
  let Extension = !cond(
      !and(Is3d, IsWriteOnly) :
          TypeExtension<"cl_khr_3d_image_writes">,
      !and(Is3d, IsReadWrite) :
          TypeExtension<"cl_khr_3d_image_writes __opencl_c_read_write_images">,
      IsDepth :
          TypeExtension<"cl_khr_depth_images">,
      IsReadWrite :
          TypeExtension<"__opencl_c_read_write_images">,
      true :
          _Ty.Extension);
}
253
// Enum type (e.g. memory_scope).  The QualType expression is a call to
// getOpenCLEnumType with the enum's name.
class EnumType<string _Name>
    : Type<_Name,
           QualType<!strconcat("getOpenCLEnumType(S, \"", _Name, "\")"), 0>> {}
258
// Typedef type (e.g. cl_mem_fence_flags).  The QualType expression is a call
// to getOpenCLTypedefType with the typedef's name.
class TypedefType<string _Name>
    : Type<_Name,
           QualType<!strconcat("getOpenCLTypedefType(S, \"", _Name, "\")"), 0>> {}
263
// A list of Type records.
class TypeList<list<Type> _Type> {
  list<Type> List = _Type;
}
268
// GenericType: an abstract type standing for a set of types, formed by
// combining a list of Types with a list of vector sizes.
//
// Example: TypeList = <int, float> with VectorList = <1, 2, 4> stands for
// <int, int2, int4, float, float2, float4>.
//
// Rules for declarations that use several GenericType arguments:
//   1. Across all gentypes of a declaration, the number of vector sizes has
//      to be either equal or 1.
//   2. Across all gentypes of a declaration, the number of Types has to be
//      either equal or 1.
//   3. All generic types are iterated at once when they are combined.
//      Given, for instance,
//        GenT1 = GenericType<half, [1, 2]> and
//        GenT2 = GenericType<float, int, [1, 2]>
//      the declaration f(GenT1, GenT2) yields the combinations
//        f(half, float), f(half2, float2), f(half, int), f(half2, int2) .
//   4. The "sgentype" of the OpenCL specification is expressed by giving a
//      single vector size.
//      Given, for instance,
//        GenT = GenericType<half, int, [1, 2]> and
//        SGenT = GenericType<half, int, [1]>
//      the declaration f(GenT, SGenT) yields the combinations
//        f(half, half), f(half2, half), f(int, int), f(int2, int) .
class GenericType<string _Ty, TypeList _TypeList, IntList _VectorList>
    : Type<_Ty, QualType<"null", 1>> {
  // Element types the generic type can take.
  TypeList TypeList = _TypeList;
  // Vector sizes that apply to the types in TypeList.
  IntList VectorList = _VectorList;
  // GenericTypes ignore VecWidth; VectorList is used in its place.
  let VecWidth = 0;
}
302
// Attribute presets for builtin functions.  The Builtin class reads element 0
// as "pure", element 1 as "const" and element 2 as "convergent".
def Attr {
  list<bit> None       = [0, 0, 0];
  list<bit> Pure       = [1, 0, 0];
  list<bit> Const      = [0, 1, 0];
  list<bit> Convergent = [0, 0, 1];
}
310
311//===----------------------------------------------------------------------===//
312//                      OpenCL C class for builtin functions
313//===----------------------------------------------------------------------===//
// Describes one builtin function declaration.  _Attributes is a three element
// bit list (see Attr) and defaults to Attr.None.
class Builtin<string _Name, list<Type> _Signature,
              list<bit> _Attributes = Attr.None> {
  // Function name.
  string Name = _Name;
  // Types making up the declaration: the return type first, then the
  // argument types.  At least one element (the return type) is required.
  list<Type> Signature = _Signature;
  // __attribute__((pure))
  bit IsPure = _Attributes[0];
  // __attribute__((const))
  bit IsConst = _Attributes[1];
  // __attribute__((convergent))
  bit IsConv = _Attributes[2];
  // OpenCL extensions the function belongs to.
  FunctionExtension Extension = FuncExtNone;
  // First OpenCL version that provides the function (e.g.: CL10); inclusive.
  Version MinVersion = CL10;
  // First OpenCL version that no longer supports the function; exclusive.
  // With CLAll the function is available for all versions.
  Version MaxVersion = CLAll;
}
337
338//===----------------------------------------------------------------------===//
339//                 Definitions of OpenCL C types
340//===----------------------------------------------------------------------===//
341
// Built-in Scalar Data Types (OpenCL v1.0/1.2/2.0 s6.1.1).
def Bool : Type<"bool", QualType<"Context.BoolTy">>;
def Char : Type<"char", QualType<"Context.CharTy">>;
def UChar : Type<"uchar", QualType<"Context.UnsignedCharTy">>;
def Short : Type<"short", QualType<"Context.ShortTy">>;
def UShort : Type<"ushort", QualType<"Context.UnsignedShortTy">>;
def Int : Type<"int", QualType<"Context.IntTy">>;
def UInt : Type<"uint", QualType<"Context.UnsignedIntTy">>;
def Long : Type<"long", QualType<"Context.LongTy">>;
def ULong : Type<"ulong", QualType<"Context.UnsignedLongTy">>;
def Float : Type<"float", QualType<"Context.FloatTy">>;
// double carries the Fp64TypeExt type extension.
def Double : Type<"double", QualType<"Context.DoubleTy">> {
  let Extension = Fp64TypeExt;
}
356
// half, for the builtins that need the cl_khr_fp16 extension.
def Half : Type<"half", QualType<"Context.HalfTy">> {
  let Extension = Fp16TypeExt;
}
361
// When cl_khr_fp16 is not enabled, half may only be used to declare a
// pointer.  For every address space below, define a pointer-to-half and a
// pointer-to-const-half type.  The pointee is named "__half" so that the
// TableGen emitter can tell this extensionless pointee apart from the "half"
// type above, which already carries the cl_khr_fp16 extension.
foreach Space = [PrivateAS, GlobalAS, ConstantAS, LocalAS, GenericAS] in {
  def "HalfPtr" # Space
      : PointerType<Type<"__half", QualType<"Context.HalfTy">>, Space>;
  def "HalfPtrConst" # Space
      : PointerType<ConstType<Type<"__half", QualType<"Context.HalfTy">>>,
                    Space>;
}
371
// Size, pointer-difference and pointer-sized integer types, plus void.
def Size : Type<"size_t", QualType<"Context.getSizeType()">>;
def PtrDiff : Type<"ptrdiff_t", QualType<"Context.getPointerDiffType()">>;
def IntPtr : Type<"intptr_t", QualType<"Context.getIntPtrType()">>;
def UIntPtr : Type<"uintptr_t", QualType<"Context.getUIntPtrType()">>;
def Void : Type<"void", QualType<"Context.VoidTy">>;
377
378// OpenCL v1.0/1.2/2.0 s6.1.2: Built-in Vector Data Types.
379// Built-in vector data types are created by TableGen's OpenCLBuiltinEmitter.
380
// Other Built-in Data Types (OpenCL v1.0/1.2/2.0 s6.1.3).
// These image records are "abstract" (their QualType has IsAbstract set); do
// not use them without specifying an access qualifier (RO/WO/RW).
def Image1d : Type<"image1d_t", QualType<"Context.OCLImage1d", 1>>;
def Image2d : Type<"image2d_t", QualType<"Context.OCLImage2d", 1>>;
def Image3d : Type<"image3d_t", QualType<"Context.OCLImage3d", 1>>;
def Image1dArray
    : Type<"image1d_array_t", QualType<"Context.OCLImage1dArray", 1>>;
def Image1dBuffer
    : Type<"image1d_buffer_t", QualType<"Context.OCLImage1dBuffer", 1>>;
def Image2dArray
    : Type<"image2d_array_t", QualType<"Context.OCLImage2dArray", 1>>;
def Image2dDepth
    : Type<"image2d_depth_t", QualType<"Context.OCLImage2dDepth", 1>>;
def Image2dArrayDepth
    : Type<"image2d_array_depth_t", QualType<"Context.OCLImage2dArrayDepth", 1>>;
def Image2dMsaa
    : Type<"image2d_msaa_t", QualType<"Context.OCLImage2dMSAA", 1>>;
def Image2dArrayMsaa
    : Type<"image2d_array_msaa_t", QualType<"Context.OCLImage2dArrayMSAA", 1>>;
def Image2dMsaaDepth
    : Type<"image2d_msaa_depth_t", QualType<"Context.OCLImage2dMSAADepth", 1>>;
def Image2dArrayMsaaDepth
    : Type<"image2d_array_msaa_depth_t", QualType<"Context.OCLImage2dArrayMSAADepth", 1>>;
396
// Sampler, event, queue and reserve-id types.
def Sampler : Type<"sampler_t", QualType<"Context.OCLSamplerTy">>;
def ClkEvent : Type<"clk_event_t", QualType<"Context.OCLClkEventTy">>;
def Event : Type<"event_t", QualType<"Context.OCLEventTy">>;
def Queue : Type<"queue_t", QualType<"Context.OCLQueueTy">>;
def ReserveId : Type<"reserve_id_t", QualType<"Context.OCLReserveIDTy">>;
// Types described through TypedefType.
def MemFenceFlags : TypedefType<"cl_mem_fence_flags">;
def ClkProfilingInfo : TypedefType<"clk_profiling_info">;
def NDRange : TypedefType<"ndrange_t">;
405
// Atomic integer and floating-point types (OpenCL v2.0 s6.13.11).
def AtomicInt
    : Type<"atomic_int", QualType<"Context.getAtomicType(Context.IntTy)">>;
def AtomicUInt
    : Type<"atomic_uint", QualType<"Context.getAtomicType(Context.UnsignedIntTy)">>;
// The 64-bit integer atomics carry Atomic64TypeExt.
def AtomicLong
    : Type<"atomic_long", QualType<"Context.getAtomicType(Context.LongTy)">> {
  let Extension = Atomic64TypeExt;
}
def AtomicULong
    : Type<"atomic_ulong", QualType<"Context.getAtomicType(Context.UnsignedLongTy)">> {
  let Extension = Atomic64TypeExt;
}
def AtomicFloat
    : Type<"atomic_float", QualType<"Context.getAtomicType(Context.FloatTy)">>;
// atomic_double carries AtomicFp64TypeExt.
def AtomicDouble
    : Type<"atomic_double", QualType<"Context.getAtomicType(Context.DoubleTy)">> {
  let Extension = AtomicFp64TypeExt;
}
def AtomicHalf
    : Type<"atomic_half", QualType<"Context.getAtomicType(Context.HalfTy)">>;
def AtomicIntPtr
    : Type<"atomic_intptr_t", QualType<"Context.getAtomicType(Context.getIntPtrType())">>;
def AtomicUIntPtr
    : Type<"atomic_uintptr_t", QualType<"Context.getAtomicType(Context.getUIntPtrType())">>;
def AtomicSize
    : Type<"atomic_size_t", QualType<"Context.getAtomicType(Context.getSizeType())">>;
def AtomicPtrDiff
    : Type<"atomic_ptrdiff_t", QualType<"Context.getAtomicType(Context.getPointerDiffType())">>;

// atomic_flag is a typedef type; memory_order and memory_scope are enum types.
def AtomicFlag : TypedefType<"atomic_flag">;
def MemoryOrder : EnumType<"memory_order">;
def MemoryScope : EnumType<"memory_scope">;
426
427//===----------------------------------------------------------------------===//
428//                 Definitions of OpenCL gentype variants
429//===----------------------------------------------------------------------===//
430// The OpenCL specification often uses "gentype" in builtin function
431// declarations to indicate that a builtin function is available with various
432// argument and return types.  The types represented by "gentype" vary between
433// different parts of the specification.  The following definitions capture
434// the different type lists for gentypes in different parts of the
435// specification.
436
// Lists of vector widths (a width of 1 denotes the scalar).
def VecAndScalar : IntList<"VecAndScalar", [1, 2, 3, 4, 8, 16]>;
def VecNoScalar : IntList<"VecNoScalar", [2, 3, 4, 8, 16]>;
def Vec1 : IntList<"Vec1", [1]>;
def Vec1234 : IntList<"Vec1234", [1, 2, 3, 4]>;
442
// Lists of element types.
def TLAll : TypeList<[Char, UChar, Short, UShort, Int, UInt, Long, ULong,
                      Float, Double, Half]>;
def TLFloat : TypeList<[Float, Double, Half]>;
def TLSignedInts : TypeList<[Char, Short, Int, Long]>;
def TLUnsignedInts : TypeList<[UChar, UShort, UInt, ULong]>;

def TLIntLongFloats : TypeList<[Int, UInt, Long, ULong, Float, Double, Half]>;

// Each unsigned integer type listed twice.  This makes unsigned return types
// possible for declarations such as
//   uchar abs(char) and
//   uchar abs(uchar).
def TLAllUIntsTwice : TypeList<[UChar, UChar, UShort, UShort,
                                UInt, UInt, ULong, ULong]>;

def TLAllInts : TypeList<[Char, UChar, Short, UShort,
                          Int, UInt, Long, ULong]>;
457
// GenTypes that cover several base types (e.g. every floating point type, or
// every integer type).

// Every type.
def AGenType1 : GenericType<"AGenType1", TLAll, Vec1>;
def AGenTypeN : GenericType<"AGenTypeN", TLAll, VecAndScalar>;
def AGenTypeNNoScalar : GenericType<"AGenTypeNNoScalar", TLAll, VecNoScalar>;

// Every integer type.
def AIGenType1 : GenericType<"AIGenType1", TLAllInts, Vec1>;
def AIGenTypeN : GenericType<"AIGenTypeN", TLAllInts, VecAndScalar>;
def AIGenTypeNNoScalar
    : GenericType<"AIGenTypeNNoScalar", TLAllInts, VecNoScalar>;

// Every integer type, mapped to unsigned.
def AI2UGenTypeN : GenericType<"AI2UGenTypeN", TLAllUIntsTwice, VecAndScalar>;

// Signed integer types.
def SGenTypeN : GenericType<"SGenTypeN", TLSignedInts, VecAndScalar>;

// Unsigned integer types.
def UGenTypeN : GenericType<"UGenTypeN", TLUnsignedInts, VecAndScalar>;

// Floating point types.
def FGenTypeN : GenericType<"FGenTypeN", TLFloat, VecAndScalar>;

// (u)int, (u)long, and every floating point type.
def IntLongFloatGenType1
    : GenericType<"IntLongFloatGenType1", TLIntLongFloats, Vec1>;

// (u)char and (u)short.
def CharShortGenType1
    : GenericType<"CharShortGenType1",
                  TypeList<[Char, UChar, Short, UShort]>, Vec1>;
481
// One GenType per base type and width list (e.g. fp32 only).  The record
// names have the form "GenType" + type record + width list record, for
// instance GenTypeFloatVecAndScalar.
foreach Elt = [Char, UChar, Short, UShort,
               Int, UInt, Long, ULong,
               Float, Double, Half] in {
  foreach Widths = [VecAndScalar, VecNoScalar] in {
    def "GenType" # Elt # Widths
        : GenericType<"GenType" # Elt # Widths, TypeList<[Elt]>, Widths>;
  }
}
493
// Per-type GenTypes restricted to the Vec1234 width list, defined for the
// floating point types only.
foreach Elt = [Float, Double, Half] in {
  def "GenType" # Elt # Vec1234
      : GenericType<"GenType" # Elt # Vec1234, TypeList<[Elt]>, Vec1234>;
}
500
501
502//===----------------------------------------------------------------------===//
503//                 Definitions of OpenCL builtin functions
504//===----------------------------------------------------------------------===//
505//--------------------------------------------------------------------
506// OpenCL v1.1/1.2/2.0 s6.2.3 - Explicit conversions.
507// OpenCL v2.0 Extensions s5.1.1 and s6.1.1 - Conversions.
508
// Generate the convert_* builtin functions: for every (result type, input
// type) pair, every saturation suffix and every rounding suffix, a scalar
// declaration followed by the vector declarations of width 2, 3, 4, 8 and 16.
foreach DstTy = [Float, Double, Half, Char, UChar, Short,
                 UShort, Int, UInt, Long, ULong] in {
  foreach SrcTy = [Float, Double, Half, Char, UChar, Short,
                   UShort, Int, UInt, Long, ULong] in {
    // Only conversions to an integer type come in both a non-sat and a sat
    // variant; a float, double or half result has the non-sat variant only.
    foreach SatSuffix = !if(!or(!eq(DstTy.Name, "float"),
                                !eq(DstTy.Name, "double"),
                                !eq(DstTy.Name, "half")),
                            [""],
                            ["", "_sat"]) in {
      foreach RndSuffix = ["", "_rte", "_rtn", "_rtp", "_rtz"] in {
        // Scalar conversion.
        def : Builtin<"convert_" # DstTy.Name # SatSuffix # RndSuffix,
                      [DstTy, SrcTy], Attr.Const>;
        // Vector conversions.
        foreach Lanes = [2, 3, 4, 8, 16] in {
          def : Builtin<"convert_" # DstTy.Name # Lanes # SatSuffix # RndSuffix,
                        [VectorType<DstTy, Lanes>, VectorType<SrcTy, Lanes>],
                        Attr.Const>;
        }
      }
    }
  }
}
531
532//--------------------------------------------------------------------
533// OpenCL v1.1 s6.11.1, v1.2 s6.12.1, v2.0 s6.13.1 - Work-item Functions
534// --- Table 7 ---
// get_work_dim takes no argument and returns uint.
def : Builtin<"get_work_dim", [UInt], Attr.Const>;
// The remaining queries take a uint argument and return size_t.
foreach FnName = ["get_global_size", "get_global_id", "get_local_size",
                  "get_local_id", "get_num_groups", "get_group_id",
                  "get_global_offset"] in
  def : Builtin<FnName, [Size, UInt], Attr.Const>;
541
// Work-item functions with MinVersion set to CL20.  They are declared with
// the default attributes (Attr.None).
let MinVersion = CL20 in {
  def : Builtin<"get_enqueued_local_size", [Size, UInt]>;
  foreach FnName = ["get_global_linear_id", "get_local_linear_id"] in
    def : Builtin<FnName, [Size]>;
}
548
549
550//--------------------------------------------------------------------
551// OpenCL v1.1 s6.11.2, v1.2 s6.12.2, v2.0 s6.13.2 - Math functions
552// OpenCL Extension v2.0 s5.1.2 and s6.1.2 - Math Functions
553// --- Table 8 ---
554// --- 1 argument ---
// Floating point gentype in, same gentype out.
foreach FnName = ["acos", "acosh", "acospi", "asin", "asinh", "asinpi",
                  "atan", "atanh", "atanpi", "cbrt", "ceil",
                  "cos", "cosh", "cospi", "erfc", "erf",
                  "exp", "exp2", "exp10", "expm1", "fabs", "floor",
                  "log", "log2", "log10", "log1p", "logb",
                  "rint", "round", "rsqrt", "sin", "sinh", "sinpi", "sqrt",
                  "tan", "tanh", "tanpi", "tgamma", "trunc", "lgamma"] in {
  def : Builtin<FnName, [FGenTypeN, FGenTypeN], Attr.Const>;
}
// nan: float from uint, double from ulong, half from ushort.
def : Builtin<"nan", [GenTypeFloatVecAndScalar, GenTypeUIntVecAndScalar],
              Attr.Const>;
def : Builtin<"nan", [GenTypeDoubleVecAndScalar, GenTypeULongVecAndScalar],
              Attr.Const>;
def : Builtin<"nan", [GenTypeHalfVecAndScalar, GenTypeUShortVecAndScalar],
              Attr.Const>;
577
// --- 2 arguments ---
// Both arguments and the result use the same floating point gentype.
foreach FnName = ["atan2", "atan2pi", "copysign", "fdim", "fmod", "hypot",
                  "maxmag", "minmag", "nextafter", "pow", "powr",
                  "remainder"] in
  def : Builtin<FnName, [FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
// fmax/fmin: the gentype form, followed by vector forms whose second argument
// is a scalar.
foreach FnName = ["fmax", "fmin"] in {
  def : Builtin<FnName, [FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
  def : Builtin<FnName,
                [GenTypeFloatVecNoScalar, GenTypeFloatVecNoScalar, Float],
                Attr.Const>;
  def : Builtin<FnName,
                [GenTypeDoubleVecNoScalar, GenTypeDoubleVecNoScalar, Double],
                Attr.Const>;
  def : Builtin<FnName,
                [GenTypeHalfVecNoScalar, GenTypeHalfVecNoScalar, Half],
                Attr.Const>;
}
// ilogb: one floating point argument, int gentype result.
foreach FloatGen = [GenTypeFloatVecAndScalar, GenTypeDoubleVecAndScalar,
                    GenTypeHalfVecAndScalar] in
  def : Builtin<"ilogb", [GenTypeIntVecAndScalar, FloatGen], Attr.Const>;
595foreach name = ["ldexp"] in {
596  def : Builtin<name, [GenTypeFloatVecAndScalar, GenTypeFloatVecAndScalar, GenTypeIntVecAndScalar], Attr.Const>;
597  def : Builtin<name, [GenTypeFloatVecNoScalar, GenTypeFloatVecNoScalar, Int], Attr.Const>;
598  def : Builtin<name, [GenTypeDoubleVecAndScalar, GenTypeDoubleVecAndScalar, GenTypeIntVecAndScalar], Attr.Const>;
599  def : Builtin<name, [GenTypeDoubleVecNoScalar, GenTypeDoubleVecNoScalar, Int], Attr.Const>;
600  def : Builtin<name, [GenTypeHalfVecAndScalar, GenTypeHalfVecAndScalar, GenTypeIntVecAndScalar], Attr.Const>;
601  def : Builtin<name, [GenTypeHalfVecNoScalar, GenTypeHalfVecNoScalar, Int], Attr.Const>;
602}
603foreach name = ["pown", "rootn"] in {
604  def : Builtin<name, [GenTypeFloatVecAndScalar, GenTypeFloatVecAndScalar, GenTypeIntVecAndScalar], Attr.Const>;
605  def : Builtin<name, [GenTypeDoubleVecAndScalar, GenTypeDoubleVecAndScalar, GenTypeIntVecAndScalar], Attr.Const>;
606  def : Builtin<name, [GenTypeHalfVecAndScalar, GenTypeHalfVecAndScalar, GenTypeIntVecAndScalar], Attr.Const>;
607}
608
609// --- 3 arguments ---
// Ternary math builtins: result and all three operands use FGenTypeN.
foreach fn = ["fma", "mad"] in
  def : Builtin<fn, [FGenTypeN, FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
613
614// The following math builtins take pointer arguments.  Which overloads are
615// available depends on whether the generic address space feature is enabled.
// Declares the math builtins whose last parameter is a pointer, once for
// every address space listed in `addrspaces`.  None of these carry an
// attribute argument, unlike the value-only math builtins.
multiclass MathWithPointer<list<AddressSpace> addrspaces> {
  foreach PtrAS = addrspaces in {
    // The pointee has the same FGenTypeN type as the value operand.
    foreach fn = ["fract", "modf", "sincos"] in
      def : Builtin<fn, [FGenTypeN, FGenTypeN, PointerType<FGenTypeN, PtrAS>]>;

    // The pointee is an int gentype regardless of the floating-point type.
    foreach fn = ["frexp", "lgamma_r"] in
      foreach FloatTy = [GenTypeFloatVecAndScalar, GenTypeDoubleVecAndScalar, GenTypeHalfVecAndScalar] in
        def : Builtin<fn, [FloatTy, FloatTy, PointerType<GenTypeIntVecAndScalar, PtrAS>]>;

    // remquo takes two floating-point operands before the int pointer.
    foreach FloatTy = [GenTypeFloatVecAndScalar, GenTypeDoubleVecAndScalar, GenTypeHalfVecAndScalar] in
      def : Builtin<"remquo", [FloatTy, FloatTy, FloatTy, PointerType<GenTypeIntVecAndScalar, PtrAS>]>;
  }
}
633
// Overloads taking pointers into the global, local and private address spaces.
let Extension = FuncExtOpenCLCNamedAddressSpaceBuiltins in
  defm : MathWithPointer<[GlobalAS, LocalAS, PrivateAS]>;

// Overloads taking pointers into the generic address space.
let Extension = FuncExtOpenCLCGenericAddressSpace in
  defm : MathWithPointer<[GenericAS]>;
640
641// --- Table 9 ---
// half_* and native_* unary builtins; declared for the float types only.
foreach fn = ["half_cos", "half_exp", "half_exp2", "half_exp10",
              "half_log", "half_log2", "half_log10",
              "half_recip", "half_rsqrt",
              "half_sin", "half_sqrt", "half_tan",
              "native_cos", "native_exp", "native_exp2", "native_exp10",
              "native_log", "native_log2", "native_log10",
              "native_recip", "native_rsqrt",
              "native_sin", "native_sqrt", "native_tan"] in
  def : Builtin<fn, [GenTypeFloatVecAndScalar, GenTypeFloatVecAndScalar], Attr.Const>;

// half_* and native_* binary builtins; declared for the float types only.
foreach fn = ["half_divide", "half_powr", "native_divide", "native_powr"] in
  def : Builtin<fn, [GenTypeFloatVecAndScalar, GenTypeFloatVecAndScalar, GenTypeFloatVecAndScalar], Attr.Const>;
658
659//--------------------------------------------------------------------
660// OpenCL v1.1 s6.11.3, v1.2 s6.12.3, v2.0 s6.13.3 - Integer Functions
661// --- Table 10 ---
662// --- 1 argument ---
// abs returns AI2UGenTypeN for an AIGenTypeN argument.
def : Builtin<"abs", [AI2UGenTypeN, AIGenTypeN], Attr.Const>;

// clz has no version restriction applied here; popcount and ctz are gated
// on a minimum OpenCL version.
def : Builtin<"clz", [AIGenTypeN, AIGenTypeN], Attr.Const>;
let MinVersion = CL12 in
  def : Builtin<"popcount", [AIGenTypeN, AIGenTypeN], Attr.Const>;
let MinVersion = CL20 in
  def : Builtin<"ctz", [AIGenTypeN, AIGenTypeN], Attr.Const>;
675
676// --- 2 arguments ---
// abs_diff returns AI2UGenTypeN for two AIGenTypeN operands.
def : Builtin<"abs_diff", [AI2UGenTypeN, AIGenTypeN, AIGenTypeN], Attr.Const>;

// Binary integer builtins whose result and operands share AIGenTypeN.
foreach fn = ["add_sat", "hadd", "rhadd", "mul_hi", "rotate", "sub_sat"] in
  def : Builtin<fn, [AIGenTypeN, AIGenTypeN, AIGenTypeN], Attr.Const>;

// Integer max/min: the all-gentype form plus a vector form whose second
// operand is AIGenType1.
foreach fn = ["max", "min"] in {
  def : Builtin<fn, [AIGenTypeN, AIGenTypeN, AIGenTypeN], Attr.Const>;
  def : Builtin<fn, [AIGenTypeNNoScalar, AIGenTypeNNoScalar, AIGenType1], Attr.Const>;
}

// upsample: each entry lists [result, first operand, second operand].
foreach Tys = [[GenTypeShortVecAndScalar, GenTypeCharVecAndScalar, GenTypeUCharVecAndScalar],
               [GenTypeUShortVecAndScalar, GenTypeUCharVecAndScalar, GenTypeUCharVecAndScalar],
               [GenTypeIntVecAndScalar, GenTypeShortVecAndScalar, GenTypeUShortVecAndScalar],
               [GenTypeUIntVecAndScalar, GenTypeUShortVecAndScalar, GenTypeUShortVecAndScalar],
               [GenTypeLongVecAndScalar, GenTypeIntVecAndScalar, GenTypeUIntVecAndScalar],
               [GenTypeULongVecAndScalar, GenTypeUIntVecAndScalar, GenTypeUIntVecAndScalar]] in
  def : Builtin<"upsample", [Tys[0], Tys[1], Tys[2]], Attr.Const>;
695
696// --- 3 arguments ---
// Integer clamp: the all-gentype form plus a vector form whose two bounds
// are AIGenType1.
def : Builtin<"clamp", [AIGenTypeN, AIGenTypeN, AIGenTypeN, AIGenTypeN], Attr.Const>;
def : Builtin<"clamp", [AIGenTypeNNoScalar, AIGenTypeNNoScalar, AIGenType1, AIGenType1], Attr.Const>;

// Ternary integer builtins whose result and operands share AIGenTypeN.
foreach fn = ["mad_hi", "mad_sat"] in
  def : Builtin<fn, [AIGenTypeN, AIGenTypeN, AIGenTypeN, AIGenTypeN], Attr.Const>;
704
705// --- Table 11 ---
// mad24 and mul24 are declared for the int and uint types only.
foreach IntTy = [GenTypeIntVecAndScalar, GenTypeUIntVecAndScalar] in
  def : Builtin<"mad24", [IntTy, IntTy, IntTy, IntTy], Attr.Const>;
foreach IntTy = [GenTypeIntVecAndScalar, GenTypeUIntVecAndScalar] in
  def : Builtin<"mul24", [IntTy, IntTy, IntTy], Attr.Const>;
714
715//--------------------------------------------------------------------
716// OpenCL v1.1 s6.11.4, v1.2 s6.12.4, v2.0 s6.13.4 - Common Functions
717// OpenCL Extension v2.0 s5.1.3 and s6.1.3 - Common Functions
718// --- Table 12 ---
719// --- 1 argument ---
// Unary common builtins: result and argument both use FGenTypeN.
foreach fn = ["degrees", "radians", "sign"] in
  def : Builtin<fn, [FGenTypeN, FGenTypeN], Attr.Const>;
723
724// --- 2 arguments ---
// Floating-point max/min: the all-gentype form, then vector forms whose
// second operand is a scalar of the same element type.
foreach fn = ["max", "min"] in {
  def : Builtin<fn, [FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
  foreach VecAndScalar = [[GenTypeFloatVecNoScalar, Float],
                          [GenTypeDoubleVecNoScalar, Double],
                          [GenTypeHalfVecNoScalar, Half]] in
    def : Builtin<fn, [VecAndScalar[0], VecAndScalar[0], VecAndScalar[1]], Attr.Const>;
}

// step: the all-gentype form, then vector forms whose first operand (the
// edge) is a scalar.
def : Builtin<"step", [FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
foreach VecAndScalar = [[GenTypeFloatVecNoScalar, Float],
                        [GenTypeDoubleVecNoScalar, Double],
                        [GenTypeHalfVecNoScalar, Half]] in
  def : Builtin<"step", [VecAndScalar[0], VecAndScalar[1], VecAndScalar[0]], Attr.Const>;
737
738// --- 3 arguments ---
// Floating-point clamp: vector forms take two scalar bounds after the value.
def : Builtin<"clamp", [FGenTypeN, FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
foreach VecAndScalar = [[GenTypeFloatVecNoScalar, Float],
                        [GenTypeDoubleVecNoScalar, Double],
                        [GenTypeHalfVecNoScalar, Half]] in
  def : Builtin<"clamp", [VecAndScalar[0], VecAndScalar[0], VecAndScalar[1], VecAndScalar[1]], Attr.Const>;

// mix: vector forms take a scalar as the last operand.
def : Builtin<"mix", [FGenTypeN, FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
foreach VecAndScalar = [[GenTypeFloatVecNoScalar, Float],
                        [GenTypeDoubleVecNoScalar, Double],
                        [GenTypeHalfVecNoScalar, Half]] in
  def : Builtin<"mix", [VecAndScalar[0], VecAndScalar[0], VecAndScalar[0], VecAndScalar[1]], Attr.Const>;

// smoothstep: vector forms take two scalar edges before the vector operand.
def : Builtin<"smoothstep", [FGenTypeN, FGenTypeN, FGenTypeN, FGenTypeN], Attr.Const>;
foreach VecAndScalar = [[GenTypeFloatVecNoScalar, Float],
                        [GenTypeDoubleVecNoScalar, Double],
                        [GenTypeHalfVecNoScalar, Half]] in
  def : Builtin<"smoothstep", [VecAndScalar[0], VecAndScalar[1], VecAndScalar[1], VecAndScalar[0]], Attr.Const>;
757
758
759//--------------------------------------------------------------------
760// OpenCL v1.1 s6.11.5, v1.2 s6.12.5, v2.0 s6.13.5 - Geometric Functions
761// OpenCL Extension v2.0 s5.1.4 and s6.1.4 - Geometric Functions
762// --- Table 13 ---
763// --- 1 argument ---
// length: scalar result for a *Vec1234 argument of the same element type.
foreach ScalarAndVec = [[Float, GenTypeFloatVec1234],
                        [Double, GenTypeDoubleVec1234],
                        [Half, GenTypeHalfVec1234]] in
  def : Builtin<"length", [ScalarAndVec[0], ScalarAndVec[1]], Attr.Const>;

// normalize: result has the same type as the argument.
foreach VecTy = [GenTypeFloatVec1234, GenTypeDoubleVec1234, GenTypeHalfVec1234] in
  def : Builtin<"normalize", [VecTy, VecTy], Attr.Const>;

// The fast_ variants are declared for float only.
def : Builtin<"fast_length", [Float, GenTypeFloatVec1234], Attr.Const>;
def : Builtin<"fast_normalize", [GenTypeFloatVec1234, GenTypeFloatVec1234], Attr.Const>;
780
781// --- 2 arguments ---
// cross is declared for 3- and 4-element vectors of float, double and half.
foreach VSize = [3, 4] in
  foreach Elt = [Float, Double, Half] in
    def : Builtin<"cross", [VectorType<Elt, VSize>, VectorType<Elt, VSize>, VectorType<Elt, VSize>], Attr.Const>;

// dot/distance: scalar result for two *Vec1234 operands of the same type.
foreach fn = ["dot", "distance"] in
  foreach ScalarAndVec = [[Float, GenTypeFloatVec1234],
                          [Double, GenTypeDoubleVec1234],
                          [Half, GenTypeHalfVec1234]] in
    def : Builtin<fn, [ScalarAndVec[0], ScalarAndVec[1], ScalarAndVec[1]], Attr.Const>;

// fast_distance is declared for float only.
def : Builtin<"fast_distance", [Float, GenTypeFloatVec1234, GenTypeFloatVec1234], Attr.Const>;
797
798
799//--------------------------------------------------------------------
800// OpenCL v1.1 s6.11.6, v1.2 s6.12.6, v2.0 s6.13.6 - Relational Functions
801// OpenCL Extension v2.0 s5.1.5 and s6.1.5 - Relational Functions
802// --- Table 14 ---
803// --- 1 argument ---
// Unary floating-point predicates.
foreach fn = ["isfinite", "isinf", "isnan", "isnormal", "signbit"] in {
  // float: int gentype result for scalar and vector arguments alike.
  def : Builtin<fn, [GenTypeIntVecAndScalar, GenTypeFloatVecAndScalar], Attr.Const>;
  // double and half: the scalar form returns Int, the vector form returns
  // the listed integer vector type.
  foreach Tys = [[Double, GenTypeLongVecNoScalar, GenTypeDoubleVecNoScalar],
                 [Half, GenTypeShortVecNoScalar, GenTypeHalfVecNoScalar]] in {
    def : Builtin<fn, [Int, Tys[0]], Attr.Const>;
    def : Builtin<fn, [Tys[1], Tys[2]], Attr.Const>;
  }
}

// any/all reduce an SGenTypeN argument to a single Int.
foreach fn = ["any", "all"] in
  def : Builtin<fn, [Int, SGenTypeN], Attr.Const>;
814
815// --- 2 arguments ---
// Binary floating-point comparisons.
foreach fn = ["isequal", "isnotequal", "isgreater", "isgreaterequal",
              "isless", "islessequal", "islessgreater", "isordered",
              "isunordered"] in {
  // float: int gentype result for scalar and vector operands alike.
  def : Builtin<fn, [GenTypeIntVecAndScalar, GenTypeFloatVecAndScalar, GenTypeFloatVecAndScalar], Attr.Const>;
  // double and half: the scalar form returns Int, the vector form returns
  // the listed integer vector type.
  foreach Tys = [[Double, GenTypeLongVecNoScalar, GenTypeDoubleVecNoScalar],
                 [Half, GenTypeShortVecNoScalar, GenTypeHalfVecNoScalar]] in {
    def : Builtin<fn, [Int, Tys[0], Tys[0]], Attr.Const>;
    def : Builtin<fn, [Tys[1], Tys[2], Tys[2]], Attr.Const>;
  }
}
825
826// --- 3 arguments ---
// bitselect: result and all three operands use AGenTypeN.
def : Builtin<"bitselect", [AGenTypeN, AGenTypeN, AGenTypeN, AGenTypeN], Attr.Const>;

// select: each entry is [data type, selector type].  The result and the
// first two operands use the data type; the last operand is the selector.
foreach DataAndSel = [[SGenTypeN, SGenTypeN],
                      [SGenTypeN, UGenTypeN],
                      [UGenTypeN, UGenTypeN],
                      [UGenTypeN, SGenTypeN],
                      [GenTypeFloatVecAndScalar, GenTypeIntVecAndScalar],
                      [GenTypeFloatVecAndScalar, GenTypeUIntVecAndScalar],
                      [GenTypeDoubleVecAndScalar, GenTypeLongVecAndScalar],
                      [GenTypeDoubleVecAndScalar, GenTypeULongVecAndScalar],
                      [GenTypeHalfVecAndScalar, GenTypeShortVecAndScalar],
                      [GenTypeHalfVecAndScalar, GenTypeUShortVecAndScalar]] in
  def : Builtin<"select", [DataAndSel[0], DataAndSel[0], DataAndSel[0], DataAndSel[1]], Attr.Const>;
842
843
844//--------------------------------------------------------------------
845// OpenCL v1.1 s6.11.7, v1.2 s6.12.7, v2.0 s6.13.7 - Vector Data Load and Store Functions
846// OpenCL Extension v1.1 s9.3.6 and s9.6.6, v1.2 s9.5.6, v2.0 s5.1.6 and s6.1.6 - Vector Data Load and Store Functions
847// --- Table 15 ---
// Declares vloadN for every address space in `addrspaces`, every vector
// width N and every element type, and the matching vstoreN builtins when
// `defStores` is set.
multiclass VloadVstore<list<AddressSpace> addrspaces, bit defStores> {
  // Element types, in the order the overloads are emitted.
  defvar ElemTypes = [Char, UChar, Short, UShort, Int, UInt, Long, ULong,
                      Float, Double, Half];

  foreach PtrAS = addrspaces in {
    foreach N = [2, 3, 4, 8, 16] in {
      // vloadN(offset, const T *) returns an N-element vector of T.
      foreach Elt = ElemTypes in
        def : Builtin<"vload" # N, [VectorType<Elt, N>, Size, PointerType<ConstType<Elt>, PtrAS>], Attr.Pure>;

      // vstoreN(vector, offset, T *) returns void.
      if defStores then {
        foreach Elt = ElemTypes in
          def : Builtin<"vstore" # N, [Void, VectorType<Elt, N>, Size, PointerType<Elt, PtrAS>]>;
      }
    }
  }
}
882
// Loads and stores through the global, local and private address spaces.
let Extension = FuncExtOpenCLCNamedAddressSpaceBuiltins in
  defm : VloadVstore<[GlobalAS, LocalAS, PrivateAS], 1>;

// Loads and stores through the generic address space.
let Extension = FuncExtOpenCLCGenericAddressSpace in
  defm : VloadVstore<[GenericAS], 1>;

// vload with constant address space is available regardless of version.
// No stores are declared for it (defStores = 0).
defm : VloadVstore<[ConstantAS], 0>;
891
// Declares the half-precision load builtins for every address space in
// `addrspaces`, and the matching store builtins when `defStores` is set.
// The pointer types are looked up by name as "HalfPtrConst<AS>" for loads
// and "HalfPtr<AS>" for stores.
multiclass VloadVstoreHalf<list<AddressSpace> addrspaces, bit defStores> {
  foreach AS = addrspaces in {
    // Scalar load, followed by the vector loads in plain and "a" flavours.
    def : Builtin<"vload_half", [Float, Size, !cast<Type>("HalfPtrConst" # AS)], Attr.Pure>;
    foreach N = [2, 3, 4, 8, 16] in
      foreach fn = ["vload_half" # N, "vloada_half" # N] in
        def : Builtin<fn, [VectorType<Float, N>, Size, !cast<Type>("HalfPtrConst" # AS)], Attr.Pure>;

    if defStores then {
      // One set of stores per rounding-mode suffix; "" is the unsuffixed form.
      foreach Rounding = ["", "_rte", "_rtz", "_rtp", "_rtn"] in {
        // Scalar stores accept a float or a double value.
        foreach Src = [Float, Double] in
          def : Builtin<"vstore_half" # Rounding, [Void, Src, Size, !cast<Type>("HalfPtr" # AS)]>;

        // Vector stores, in plain and "a" flavours, for float and double.
        foreach N = [2, 3, 4, 8, 16] in
          foreach fn = ["vstore_half" # N # Rounding, "vstorea_half" # N # Rounding] in
            foreach Src = [Float, Double] in
              def : Builtin<fn, [Void, VectorType<Src, N>, Size, !cast<Type>("HalfPtr" # AS)]>;
      }
    }
  }
}
916
// Half loads and stores through the global, local and private address spaces.
let Extension = FuncExtOpenCLCNamedAddressSpaceBuiltins in
  defm : VloadVstoreHalf<[GlobalAS, LocalAS, PrivateAS], 1>;

// Half loads and stores through the generic address space.
let Extension = FuncExtOpenCLCGenericAddressSpace in
  defm : VloadVstoreHalf<[GenericAS], 1>;

// vload_half and vloada_half with constant address space are available
// regardless of version.  No stores are declared for it (defStores = 0).
defm : VloadVstoreHalf<[ConstantAS], 0>;
925
926// OpenCL v3.0 s6.15.8 - Synchronization Functions.
// barrier has no version restriction applied here and is marked convergent.
def : Builtin<"barrier", [Void, MemFenceFlags], Attr.Convergent>;

// work_group_barrier requires CL20 and comes with and without an explicit
// memory scope argument.
let MinVersion = CL20 in {
  def : Builtin<"work_group_barrier",
                [Void, MemFenceFlags],
                Attr.Convergent>;
  def : Builtin<"work_group_barrier",
                [Void, MemFenceFlags, MemoryScope],
                Attr.Convergent>;
}
932
933// OpenCL v3.0 s6.15.9 - Legacy Explicit Memory Fence Functions.
// The three legacy fences share one signature: void(cl_mem_fence_flags).
foreach fn = ["mem_fence", "read_mem_fence", "write_mem_fence"] in
  def : Builtin<fn, [Void, MemFenceFlags]>;
937
938// OpenCL v3.0 s6.15.10 - Address Space Qualifier Functions.
939// to_global, to_local, to_private are declared in Builtins.td.
940
let Extension = FuncExtOpenCLCGenericAddressSpace in {
  // The OpenCL 3.0 specification declares get_fence with a "gentype"
  // argument, meaning any builtin or user-defined type.  That cannot be
  // represented here at present, so we diverge slightly and provide only
  // void-pointer overloads: one for a plain and one for a const pointee.
  def : Builtin<"get_fence",
                [MemFenceFlags, PointerType<Void, GenericAS>]>;
  def : Builtin<"get_fence",
                [MemFenceFlags, PointerType<ConstType<Void>, GenericAS>]>;
}
948
949//--------------------------------------------------------------------
950// OpenCL v1.1 s6.11.10, v1.2 s6.12.10, v2.0 s6.13.10: Async Copies from Global to Local Memory, Local to Global Memory, and Prefetch
951// OpenCL Extension v2.0 s5.1.7 and s6.1.7: Async Copies from Global to Local Memory, Local to Global Memory, and Prefetch
952// --- Table 18 ---
// Async copies between local and global memory.  Each entry lists the
// [destination, source] address spaces; the source pointee is const.
foreach DstAndSrc = [[LocalAS, GlobalAS], [GlobalAS, LocalAS]] in
  def : Builtin<"async_work_group_copy", [Event, PointerType<AGenTypeN, DstAndSrc[0]>, PointerType<ConstType<AGenTypeN>, DstAndSrc[1]>, Size, Event]>;

// The strided variant takes one additional Size operand.
foreach DstAndSrc = [[LocalAS, GlobalAS], [GlobalAS, LocalAS]] in
  def : Builtin<"async_work_group_strided_copy", [Event, PointerType<AGenTypeN, DstAndSrc[0]>, PointerType<ConstType<AGenTypeN>, DstAndSrc[1]>, Size, Size, Event]>;

// wait_group_events takes its event list through a generic-AS pointer.
def : Builtin<"wait_group_events", [Void, Int, PointerType<Event, GenericAS>]>;

// prefetch reads through a const pointer into global memory.
def : Builtin<"prefetch", [Void, PointerType<ConstType<AGenTypeN>, GlobalAS>, Size]>;
967
968//--------------------------------------------------------------------
969// OpenCL v2.0 s6.13.11 - Atomics Functions.
970// Functions that use memory_order and cl_mem_fence_flags enums are not
971// declared here as the TableGen backend does not handle enums.
972
973// OpenCL v1.0 s9.5, s9.6, s9.7 - Atomic Functions for 32-bit integers
974// --- Table 9.1 ---
// 32-bit base atomics on volatile pointers into global memory.
let Extension = FuncExtKhrGlobalInt32BaseAtomics in {
  foreach IntTy = [Int, UInt] in {
    defvar Ptr = PointerType<VolatileType<IntTy>, GlobalAS>;

    // Pointer plus one operand.
    foreach fn = ["atom_add", "atom_sub", "atom_xchg"] in
      def : Builtin<fn, [IntTy, Ptr, IntTy]>;
    // Pointer only.
    foreach fn = ["atom_inc", "atom_dec"] in
      def : Builtin<fn, [IntTy, Ptr]>;
    // Pointer plus two operands.
    def : Builtin<"atom_cmpxchg", [IntTy, Ptr, IntTy, IntTy]>;
  }
}
988// --- Table 9.3 ---
// 32-bit base atomics on volatile pointers into local memory.
let Extension = FuncExtKhrLocalInt32BaseAtomics in {
  foreach IntTy = [Int, UInt] in {
    defvar Ptr = PointerType<VolatileType<IntTy>, LocalAS>;

    // Pointer plus one operand.
    foreach fn = ["atom_add", "atom_sub", "atom_xchg"] in
      def : Builtin<fn, [IntTy, Ptr, IntTy]>;
    // Pointer only.
    foreach fn = ["atom_inc", "atom_dec"] in
      def : Builtin<fn, [IntTy, Ptr]>;
    // Pointer plus two operands.
    def : Builtin<"atom_cmpxchg", [IntTy, Ptr, IntTy, IntTy]>;
  }
}
1002// --- Table 9.5 ---
// 64-bit base atomics; one extension covers both global and local memory.
let Extension = FuncExtKhrInt64BaseAtomics in {
  foreach PtrAS = [GlobalAS, LocalAS] in {
    foreach IntTy = [Long, ULong] in {
      defvar Ptr = PointerType<VolatileType<IntTy>, PtrAS>;

      // Pointer plus one operand.
      foreach fn = ["atom_add", "atom_sub", "atom_xchg"] in
        def : Builtin<fn, [IntTy, Ptr, IntTy]>;
      // Pointer only.
      foreach fn = ["atom_inc", "atom_dec"] in
        def : Builtin<fn, [IntTy, Ptr]>;
      // Pointer plus two operands.
      def : Builtin<"atom_cmpxchg", [IntTy, Ptr, IntTy, IntTy]>;
    }
  }
}
1018// --- Table 9.2 ---
// 32-bit extended atomics on volatile pointers into global memory.
let Extension = FuncExtKhrGlobalInt32ExtendedAtomics in
  foreach IntTy = [Int, UInt] in
    foreach fn = ["atom_min", "atom_max", "atom_and", "atom_or", "atom_xor"] in
      def : Builtin<fn, [IntTy, PointerType<VolatileType<IntTy>, GlobalAS>, IntTy]>;
1027// --- Table 9.4 ---
// 32-bit extended atomics on volatile pointers into local memory.
let Extension = FuncExtKhrLocalInt32ExtendedAtomics in
  foreach IntTy = [Int, UInt] in
    foreach fn = ["atom_min", "atom_max", "atom_and", "atom_or", "atom_xor"] in
      def : Builtin<fn, [IntTy, PointerType<VolatileType<IntTy>, LocalAS>, IntTy]>;
1036// --- Table 9.6 ---
// 64-bit extended atomics; one extension covers both global and local memory.
let Extension = FuncExtKhrInt64ExtendedAtomics in
  foreach PtrAS = [GlobalAS, LocalAS] in
    foreach IntTy = [Long, ULong] in
      foreach fn = ["atom_min", "atom_max", "atom_and", "atom_or", "atom_xor"] in
        def : Builtin<fn, [IntTy, PointerType<VolatileType<IntTy>, PtrAS>, IntTy]>;
// OpenCL v1.1 s6.11.11, v1.2 s6.12.11 - Atomic Functions
// atomic_* builtins on volatile pointers into global and local memory.
foreach PtrAS = [GlobalAS, LocalAS] in {
  // atomic_xchg is the only one of these declared for float.
  def : Builtin<"atomic_xchg", [Float, PointerType<VolatileType<Float>, PtrAS>, Float]>;

  foreach IntTy = [Int, UInt] in {
    defvar Ptr = PointerType<VolatileType<IntTy>, PtrAS>;

    // Pointer plus one operand.
    foreach fn = ["atomic_add", "atomic_sub", "atomic_xchg",
                  "atomic_min", "atomic_max", "atomic_and",
                  "atomic_or", "atomic_xor"] in
      def : Builtin<fn, [IntTy, Ptr, IntTy]>;
    // Pointer only.
    foreach fn = ["atomic_inc", "atomic_dec"] in
      def : Builtin<fn, [IntTy, Ptr]>;
    // Pointer plus two operands.
    def : Builtin<"atomic_cmpxchg", [IntTy, Ptr, IntTy, IntTy]>;
  }
}
1064
// The same integer atomic_* builtins on generic-address-space pointers,
// gated on FuncExtOpenCLCxx.
let Extension = FuncExtOpenCLCxx in {
  foreach IntTy = [Int, UInt] in {
    defvar Ptr = PointerType<VolatileType<IntTy>, GenericAS>;

    // Pointer plus one operand.
    foreach fn = ["atomic_add", "atomic_sub", "atomic_xchg",
                  "atomic_min", "atomic_max", "atomic_and",
                  "atomic_or", "atomic_xor"] in
      def : Builtin<fn, [IntTy, Ptr, IntTy]>;
    // Pointer only.
    foreach fn = ["atomic_inc", "atomic_dec"] in
      def : Builtin<fn, [IntTy, Ptr]>;
    // Pointer plus two operands.
    def : Builtin<"atomic_cmpxchg", [IntTy, Ptr, IntTy, IntTy]>;
  }
}
1080
1081// OpenCL v2.0 s6.13.11 - Atomic Functions.
1082
1083// An atomic builtin with 2 additional _explicit variants.
// Declares three overloads of one atomic builtin:
//   Name(Types...)
//   Name_explicit(Types..., memory_order)
//   Name_explicit(Types..., memory_order, memory_scope)
// `Types` is the signature of the plain form, return type first.  The fewer
// explicit arguments an overload takes, the more feature macros are appended
// to `BaseExt` for it.
multiclass BuiltinAtomicExplicit<string Name, list<Type> Types, FunctionExtension BaseExt> {
  defvar ExplicitName = Name # "_explicit";

  // Implicit order and scope.
  let Extension = concatExtension<BaseExt, "__opencl_c_atomic_order_seq_cst __opencl_c_atomic_scope_device">.ret in
    def : Builtin<Name, Types>;

  // Explicit order, implicit scope.
  let Extension = concatExtension<BaseExt, "__opencl_c_atomic_scope_device">.ret in
    def : Builtin<ExplicitName, !listconcat(Types, [MemoryOrder])>;

  // Explicit order and scope: only the base extension is required.
  let Extension = BaseExt in
    def : Builtin<ExplicitName, !listconcat(Types, [MemoryOrder, MemoryScope])>;
}
1100
1101// OpenCL 2.0 atomic functions that have a pointer argument in a given address space.
// Declares the OpenCL 2.0 atomic builtins whose atomic object is reached
// through a volatile pointer into `addrspace`.  `BaseExt` gates every
// declaration and also selects which address spaces are used for the
// "expected" pointer of the compare-exchange builtins.
multiclass OpenCL2Atomics<AddressSpace addrspace, FunctionExtension BaseExt> {
  // Each entry is [atomic object type, plain value type].
  foreach AtomicAndValue = [[AtomicInt, Int], [AtomicUInt, UInt],
                            [AtomicLong, Long], [AtomicULong, ULong],
                            [AtomicFloat, Float], [AtomicDouble, Double]] in {
    defvar ObjectPtr = PointerType<VolatileType<AtomicAndValue[0]>, addrspace>;
    defvar ValueTy = AtomicAndValue[1];

    // atomic_init has no _explicit variants.
    let Extension = BaseExt in
      def : Builtin<"atomic_init", [Void, ObjectPtr, ValueTy]>;

    defm : BuiltinAtomicExplicit<"atomic_store", [Void, ObjectPtr, ValueTy], BaseExt>;
    defm : BuiltinAtomicExplicit<"atomic_load", [ValueTy, ObjectPtr], BaseExt>;
    defm : BuiltinAtomicExplicit<"atomic_exchange", [ValueTy, ObjectPtr, ValueTy], BaseExt>;

    // Compare-exchange is spelled out rather than routed through
    // BuiltinAtomicExplicit because its _explicit forms take two
    // memory_order arguments.
    foreach Strength = ["weak", "strong"] in {
      foreach ExpectedAS = !cond(
            !eq(BaseExt, FuncExtOpenCLCGenericAddressSpace): [GenericAS],
            !eq(BaseExt, FuncExtOpenCLCNamedAddressSpaceBuiltins): [GlobalAS, LocalAS, PrivateAS])
          in {
        defvar CmpXchgName = "atomic_compare_exchange_" # Strength;
        defvar ExpectedPtr = PointerType<ValueTy, ExpectedAS>;

        // Implicit order and scope.
        let Extension = concatExtension<BaseExt, "__opencl_c_atomic_order_seq_cst __opencl_c_atomic_scope_device">.ret in
          def : Builtin<CmpXchgName,
              [Bool, ObjectPtr, ExpectedPtr, ValueTy]>;

        // Explicit success/failure orders, implicit scope.
        let Extension = concatExtension<BaseExt, "__opencl_c_atomic_scope_device">.ret in
          def : Builtin<CmpXchgName # "_explicit",
              [Bool, ObjectPtr, ExpectedPtr, ValueTy, MemoryOrder, MemoryOrder]>;

        // Explicit success/failure orders and scope.
        let Extension = BaseExt in
          def : Builtin<CmpXchgName # "_explicit",
              [Bool, ObjectPtr, ExpectedPtr, ValueTy, MemoryOrder, MemoryOrder, MemoryScope]>;
      }
    }
  }

  // Each entry is [atomic object type, result type, operand type].
  // add/sub are additionally declared for atomic_uintptr_t, whose operand
  // type (PtrDiff) differs from its result type (UIntPtr).
  foreach Tys = [[AtomicInt, Int, Int], [AtomicUInt, UInt, UInt],
                 [AtomicLong, Long, Long], [AtomicULong, ULong, ULong],
                 [AtomicUIntPtr, UIntPtr, PtrDiff]] in
    foreach ModOp = ["add", "sub"] in
      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Tys[1], PointerType<VolatileType<Tys[0]>, addrspace>, Tys[2]], BaseExt>;

  foreach Tys = [[AtomicInt, Int, Int], [AtomicUInt, UInt, UInt],
                 [AtomicLong, Long, Long], [AtomicULong, ULong, ULong]] in
    foreach ModOp = ["or", "xor", "and", "min", "max"] in
      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Tys[1], PointerType<VolatileType<Tys[0]>, addrspace>, Tys[2]], BaseExt>;

  // atomic_flag operations.
  defm : BuiltinAtomicExplicit<"atomic_flag_clear",
      [Void, PointerType<VolatileType<AtomicFlag>, addrspace>], BaseExt>;

  defm : BuiltinAtomicExplicit<"atomic_flag_test_and_set",
      [Bool, PointerType<VolatileType<AtomicFlag>, addrspace>], BaseExt>;
}
1162
// Everything below requires CL20.
let MinVersion = CL20 in {
  def : Builtin<"atomic_work_item_fence", [Void, MemFenceFlags, MemoryOrder, MemoryScope]>;

  // Atomic objects reached through generic-address-space pointers.
  defm : OpenCL2Atomics<GenericAS, FuncExtOpenCLCGenericAddressSpace>;

  // Atomic objects reached through global and local pointers.
  foreach NamedAS = [GlobalAS, LocalAS] in
    defm : OpenCL2Atomics<NamedAS, FuncExtOpenCLCNamedAddressSpaceBuiltins>;
}
1170
1171// The functionality added by cl_ext_float_atomics extension
// Builtins added by cl_ext_float_atomics, declared per address space.  Each
// group is gated on a FunctionExtension record looked up by name:
// "FuncExtFloatAtomics" # <Fp16|Fp32|Fp64> # <address space> # <feature>.
let MinVersion = CL20 in {
  foreach addrspace = [GlobalAS, LocalAS, GenericAS] in {
    // Only the half-precision load/store/exchange overloads are declared
    // here; OpenCL2Atomics already declares them for atomic_float and
    // atomic_double.  Named distinctly from the per-operation
    // `extension_fp16` variables in the loops below to avoid shadowing.
    defvar extension_fp16_load_store = !cast<FunctionExtension>("FuncExtFloatAtomicsFp16" # addrspace # "LoadStore");

    // The value being stored is a plain half; only the pointee is
    // atomic_half.  This matches every other atomic_store overload, which
    // passes the non-atomic value type.
    defm : BuiltinAtomicExplicit<"atomic_store",
        [Void, PointerType<VolatileType<AtomicHalf>, addrspace>, Half], extension_fp16_load_store>;
    defm : BuiltinAtomicExplicit<"atomic_load",
        [Half, PointerType<VolatileType<AtomicHalf>, addrspace>], extension_fp16_load_store>;
    defm : BuiltinAtomicExplicit<"atomic_exchange",
        [Half, PointerType<VolatileType<AtomicHalf>, addrspace>, Half], extension_fp16_load_store>;

    // atomic_fetch_add / atomic_fetch_sub share the "Add" feature.
    foreach ModOp = ["add", "sub"] in {
      defvar extension_fp16 = !cast<FunctionExtension>("FuncExtFloatAtomicsFp16" # addrspace # "Add");
      defvar extension_fp32 = !cast<FunctionExtension>("FuncExtFloatAtomicsFp32" # addrspace # "Add");
      defvar extension_fp64 = !cast<FunctionExtension>("FuncExtFloatAtomicsFp64" # addrspace # "Add");

      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Half, PointerType<VolatileType<AtomicHalf>, addrspace>, Half], extension_fp16>;
      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Float, PointerType<VolatileType<AtomicFloat>, addrspace>, Float], extension_fp32>;
      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Double, PointerType<VolatileType<AtomicDouble>, addrspace>, Double], extension_fp64>;
    }

    // atomic_fetch_min / atomic_fetch_max share the "MinMax" feature.
    foreach ModOp = ["min", "max"] in {
      defvar extension_fp16 = !cast<FunctionExtension>("FuncExtFloatAtomicsFp16" # addrspace # "MinMax");
      defvar extension_fp32 = !cast<FunctionExtension>("FuncExtFloatAtomicsFp32" # addrspace # "MinMax");
      defvar extension_fp64 = !cast<FunctionExtension>("FuncExtFloatAtomicsFp64" # addrspace # "MinMax");

      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Half, PointerType<VolatileType<AtomicHalf>, addrspace>, Half], extension_fp16>;
      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Float, PointerType<VolatileType<AtomicFloat>, addrspace>, Float], extension_fp32>;
      defm : BuiltinAtomicExplicit<"atomic_fetch_" # ModOp,
          [Double, PointerType<VolatileType<AtomicDouble>, addrspace>, Double], extension_fp64>;
    }
  }
}
1210
1211//--------------------------------------------------------------------
1212// OpenCL v1.1 s6.11.12, v1.2 s6.12.12, v2.0 s6.13.12 - Miscellaneous Vector Functions
1213// --- Table 19 ---
// shuffle: one overload per (ResultLen, InputLen, element type) combination.
// ElemAndMask[0] is the element type of the first and second signature
// entries; ElemAndMask[1] is the element type of the mask, which has
// ResultLen components.
1214foreach ResultLen = [2, 4, 8, 16] in {
1215  foreach InputLen = [2, 4, 8, 16] in {
1216    foreach ElemAndMask = [[Char, UChar], [UChar, UChar],
1217                              [Short, UShort], [UShort, UShort],
1218                              [Int, UInt], [UInt, UInt],
1219                              [Long, ULong], [ULong, ULong],
1220                              [Float, UInt], [Double, ULong], [Half, UShort]] in {
1221      def : Builtin<"shuffle", [VectorType<ElemAndMask[0], ResultLen>,
1222                                VectorType<ElemAndMask[0], InputLen>,
1223                                VectorType<ElemAndMask[1], ResultLen>],
1224                               Attr.Const>;
1225    }
1226  }
1227}
// shuffle2: same iteration space as shuffle, but the signature carries two
// InputLen-wide vectors of ElemAndMask[0] before the ResultLen-wide mask of
// ElemAndMask[1].
1228foreach ResultLen = [2, 4, 8, 16] in {
1229  foreach InputLen = [2, 4, 8, 16] in {
1230    foreach ElemAndMask = [[Char, UChar], [UChar, UChar],
1231                              [Short, UShort], [UShort, UShort],
1232                              [Int, UInt], [UInt, UInt],
1233                              [Long, ULong], [ULong, ULong],
1234                              [Float, UInt], [Double, ULong], [Half, UShort]] in {
1235      def : Builtin<"shuffle2", [VectorType<ElemAndMask[0], ResultLen>,
1236                                 VectorType<ElemAndMask[0], InputLen>,
1237                                 VectorType<ElemAndMask[0], InputLen>,
1238                                 VectorType<ElemAndMask[1], ResultLen>],
1239                                Attr.Const>;
1240    }
1241  }
1242}
1243
1244//--------------------------------------------------------------------
1245// OpenCL v1.1 s6.11.13, v1.2 s6.12.14, v2.0 s6.13.14: Image Read and Write Functions
1246// OpenCL Extension v2.0 s5.1.8 and s6.1.8: Image Read and Write Functions
1247// --- Table 22: Image Read Functions with Samplers ---
// Read-only image reads that take a Sampler.  Coordinates are either Int or
// Float; their width depends on the image type.
// 1D images: scalar coordinate.
1248foreach img = [Image1d] in {
1249  foreach coord = [Int, Float] in {
1250    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, "RO">, Sampler, coord], Attr.Pure>;
1251    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, "RO">, Sampler, coord], Attr.Pure>;
1252    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, "RO">, Sampler, coord], Attr.Pure>;
1253  }
1254}
// 2D images and 1D image arrays: 2-component coordinate.
1255foreach img = [Image2d, Image1dArray] in {
1256  foreach coord = [Int, Float] in {
1257    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, "RO">, Sampler, VectorType<coord, 2>], Attr.Pure>;
1258    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, "RO">, Sampler, VectorType<coord, 2>], Attr.Pure>;
1259    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, "RO">, Sampler, VectorType<coord, 2>], Attr.Pure>;
1260  }
1261}
// 3D images and 2D image arrays: 4-component coordinate.
1262foreach img = [Image3d, Image2dArray] in {
1263  foreach coord = [Int, Float] in {
1264    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, "RO">, Sampler, VectorType<coord, 4>], Attr.Pure>;
1265    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, "RO">, Sampler, VectorType<coord, 4>], Attr.Pure>;
1266    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, "RO">, Sampler, VectorType<coord, 4>], Attr.Pure>;
1267  }
1268}
// Depth images: only read_imagef, with a scalar Float leading the signature.
1269foreach coord = [Int, Float] in {
1270  def : Builtin<"read_imagef", [Float, ImageType<Image2dDepth, "RO">, Sampler, VectorType<coord, 2>], Attr.Pure>;
1271  def : Builtin<"read_imagef", [Float, ImageType<Image2dArrayDepth, "RO">, Sampler, VectorType<coord, 4>], Attr.Pure>;
1272}
1273
1274// --- Table 23: Sampler-less Read Functions ---
// Sampler-less image reads for the access qualifier aQual.  All coordinates
// are Int; their width depends on the image type.
1275multiclass ImageReadSamplerless<string aQual> {
      // 2-component coordinate.
1276  foreach img = [Image2d, Image1dArray] in {
1277    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, aQual>, VectorType<Int, 2>], Attr.Pure>;
1278    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, aQual>, VectorType<Int, 2>], Attr.Pure>;
1279    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, aQual>, VectorType<Int, 2>], Attr.Pure>;
1280  }
      // 4-component coordinate.
1281  foreach img = [Image3d, Image2dArray] in {
1282    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, aQual>, VectorType<Int, 4>], Attr.Pure>;
1283    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, aQual>, VectorType<Int, 4>], Attr.Pure>;
1284    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, aQual>, VectorType<Int, 4>], Attr.Pure>;
1285  }
      // Scalar coordinate; unlike the sampler variants this list includes
      // Image1dBuffer.
1286  foreach img = [Image1d, Image1dBuffer] in {
1287    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, aQual>, Int], Attr.Pure>;
1288    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, aQual>, Int], Attr.Pure>;
1289    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, aQual>, Int], Attr.Pure>;
1290  }
      // Depth images: read_imagef only.
1291  def : Builtin<"read_imagef", [Float, ImageType<Image2dDepth, aQual>, VectorType<Int, 2>], Attr.Pure>;
1292  def : Builtin<"read_imagef", [Float, ImageType<Image2dArrayDepth, aQual>, VectorType<Int, 4>], Attr.Pure>;
1293}
1294
// Instantiates the sampler-less reads with MinVersion set to CL12: once for
// "RO" images, and once for "RW" images under the read-write-images extension.
1295let MinVersion = CL12 in {
1296  defm : ImageReadSamplerless<"RO">;
1297  let Extension = FuncExtOpenCLCReadWriteImages in {
1298    defm : ImageReadSamplerless<"RW">;
1299  }
1300}
1301
1302// --- Table 24: Image Write Functions ---
// Image writes for the access qualifier aQual.  Each group emits
// write_imagef/i/ui with an Int coordinate (scalar, 2- or 4-component
// depending on the image type) followed by a 4-component colour value.
1303multiclass ImageWrite<string aQual> {
1304  foreach img = [Image2d] in {
1305    def : Builtin<"write_imagef", [Void, ImageType<img, aQual>, VectorType<Int, 2>, VectorType<Float, 4>]>;
1306    def : Builtin<"write_imagei", [Void, ImageType<img, aQual>, VectorType<Int, 2>, VectorType<Int, 4>]>;
1307    def : Builtin<"write_imageui", [Void, ImageType<img, aQual>, VectorType<Int, 2>, VectorType<UInt, 4>]>;
1308  }
1309  foreach img = [Image2dArray] in {
1310    def : Builtin<"write_imagef", [Void, ImageType<img, aQual>, VectorType<Int, 4>, VectorType<Float, 4>]>;
1311    def : Builtin<"write_imagei", [Void, ImageType<img, aQual>, VectorType<Int, 4>, VectorType<Int, 4>]>;
1312    def : Builtin<"write_imageui", [Void, ImageType<img, aQual>, VectorType<Int, 4>, VectorType<UInt, 4>]>;
1313  }
1314  foreach img = [Image1d, Image1dBuffer] in {
1315    def : Builtin<"write_imagef", [Void, ImageType<img, aQual>, Int, VectorType<Float, 4>]>;
1316    def : Builtin<"write_imagei", [Void, ImageType<img, aQual>, Int, VectorType<Int, 4>]>;
1317    def : Builtin<"write_imageui", [Void, ImageType<img, aQual>, Int, VectorType<UInt, 4>]>;
1318  }
1319  foreach img = [Image1dArray] in {
1320    def : Builtin<"write_imagef", [Void, ImageType<img, aQual>, VectorType<Int, 2>, VectorType<Float, 4>]>;
1321    def : Builtin<"write_imagei", [Void, ImageType<img, aQual>, VectorType<Int, 2>, VectorType<Int, 4>]>;
1322    def : Builtin<"write_imageui", [Void, ImageType<img, aQual>, VectorType<Int, 2>, VectorType<UInt, 4>]>;
1323  }
1324  foreach img = [Image3d] in {
1325    def : Builtin<"write_imagef", [Void, ImageType<img, aQual>, VectorType<Int, 4>, VectorType<Float, 4>]>;
1326    def : Builtin<"write_imagei", [Void, ImageType<img, aQual>, VectorType<Int, 4>, VectorType<Int, 4>]>;
1327    def : Builtin<"write_imageui", [Void, ImageType<img, aQual>, VectorType<Int, 4>, VectorType<UInt, 4>]>;
1328  }
      // Depth images take a scalar Float value and only have write_imagef.
1329  def : Builtin<"write_imagef", [Void, ImageType<Image2dDepth, aQual>, VectorType<Int, 2>, Float]>;
1330  def : Builtin<"write_imagef", [Void, ImageType<Image2dArrayDepth, aQual>, VectorType<Int, 4>, Float]>;
1331}
1332
// Image writes for "WO" images, and for "RW" images under the
// read-write-images extension.
1333defm : ImageWrite<"WO">;
1334let Extension = FuncExtOpenCLCReadWriteImages in {
1335  defm : ImageWrite<"RW">;
1336}
1337
1338// --- Table 25: Image Query Functions ---
// Image query builtins for the access qualifier aQual.  Every query takes a
// single image argument; the set of image types differs per query.
1339multiclass ImageQuery<string aQual> {
      // Width, channel data type and channel order: all eight image types.
1340  foreach img = [Image1d, Image1dBuffer, Image2d, Image3d,
1341                   Image1dArray, Image2dArray, Image2dDepth,
1342                   Image2dArrayDepth] in {
1343    foreach query = ["get_image_width", "get_image_channel_data_type",
1344                    "get_image_channel_order"] in {
1345      def : Builtin<query, [Int, ImageType<img, aQual>], Attr.Const>;
1346    }
1347  }
      // Height: the 2D and 3D image types only.
1348  foreach img = [Image2d, Image3d, Image2dArray, Image2dDepth,
1349                   Image2dArrayDepth] in {
1350    def : Builtin<"get_image_height", [Int, ImageType<img, aQual>], Attr.Const>;
1351  }
      // Depth: Image3d only.
1352  def : Builtin<"get_image_depth", [Int, ImageType<Image3d, aQual>], Attr.Const>;
      // get_image_dim: 2-component for the 2D image types, 4-component for Image3d.
1353  foreach img = [Image2d, Image2dArray, Image2dDepth,
1354                   Image2dArrayDepth] in {
1355    def : Builtin<"get_image_dim", [VectorType<Int, 2>, ImageType<img, aQual>], Attr.Const>;
1356  }
1357  def : Builtin<"get_image_dim", [VectorType<Int, 4>, ImageType<Image3d, aQual>], Attr.Const>;
      // Array size: the array image types only; uses Size rather than Int.
1358  foreach img = [Image1dArray, Image2dArray, Image2dArrayDepth] in {
1359    def : Builtin<"get_image_array_size", [Size, ImageType<img, aQual>], Attr.Const>;
1360  }
1361}
1362
// Image queries for "RO" and "WO" images, and for "RW" images under the
// read-write-images extension.
1363defm : ImageQuery<"RO">;
1364defm : ImageQuery<"WO">;
1365let Extension = FuncExtOpenCLCReadWriteImages in {
1366  defm : ImageQuery<"RW">;
1367}
1368
1369// OpenCL extension v2.0 s5.1.9: Built-in Image Read Functions
1370// --- Table 8 ---
// read_imageh with a Sampler, for "RO" images only.  Coordinates are Int or
// Float: 2-component, 4-component or scalar depending on the image type.
1371foreach access = ["RO"] in {
1372  foreach fn = ["read_imageh"] in {
1373    foreach coord = [Int, Float] in {
1374      foreach img = [Image2d, Image1dArray] in {
1375        def : Builtin<fn, [VectorType<Half, 4>, ImageType<img, access>, Sampler, VectorType<coord, 2>], Attr.Pure>;
1376      }
1377      foreach img = [Image3d, Image2dArray] in {
1378        def : Builtin<fn, [VectorType<Half, 4>, ImageType<img, access>, Sampler, VectorType<coord, 4>], Attr.Pure>;
1379      }
1380      foreach img = [Image1d] in {
1381        def : Builtin<fn, [VectorType<Half, 4>, ImageType<img, access>, Sampler, coord], Attr.Pure>;
1382      }
1383    }
1384  }
1385}
1386// OpenCL extension v2.0 s5.1.10: Built-in Image Sampler-less Read Functions
1387// --- Table 9 ---
// Sampler-less read_imageh, defined and instantiated with MinVersion set to
// CL12.  Coordinates are always Int.
1388let MinVersion = CL12 in {
1389  multiclass ImageReadHalf<string aQual> {
1390    foreach fn = ["read_imageh"] in {
1391      foreach img = [Image2d, Image1dArray] in {
1392        def : Builtin<fn, [VectorType<Half, 4>, ImageType<img, aQual>, VectorType<Int, 2>], Attr.Pure>;
1393      }
1394      foreach img = [Image3d, Image2dArray] in {
1395        def : Builtin<fn, [VectorType<Half, 4>, ImageType<img, aQual>, VectorType<Int, 4>], Attr.Pure>;
1396      }
1397      foreach img = [Image1d, Image1dBuffer] in {
1398        def : Builtin<fn, [VectorType<Half, 4>, ImageType<img, aQual>, Int], Attr.Pure>;
1399      }
1400    }
1401  }
      // "RO" images unconditionally; "RW" images under the read-write-images
      // extension.
1402  defm : ImageReadHalf<"RO">;
1403  let Extension = FuncExtOpenCLCReadWriteImages in {
1404    defm : ImageReadHalf<"RW">;
1405  }
1406}
1407// OpenCL extension v2.0 s5.1.11: Built-in Image Write Functions
1408// --- Table 10 ---
// write_imageh for the access qualifier aQual: one overload per image type,
// each with an Int coordinate and a 4-component Half value.
1409multiclass ImageWriteHalf<string aQual> {
1410  foreach fn = ["write_imageh"] in {
1411    def : Builtin<fn, [Void, ImageType<Image2d, aQual>, VectorType<Int, 2>, VectorType<Half, 4>]>;
1412    def : Builtin<fn, [Void, ImageType<Image2dArray, aQual>, VectorType<Int, 4>, VectorType<Half, 4>]>;
1413    def : Builtin<fn, [Void, ImageType<Image1d, aQual>, Int, VectorType<Half, 4>]>;
1414    def : Builtin<fn, [Void, ImageType<Image1dBuffer, aQual>, Int, VectorType<Half, 4>]>;
1415    def : Builtin<fn, [Void, ImageType<Image1dArray, aQual>, VectorType<Int, 2>, VectorType<Half, 4>]>;
1416    def : Builtin<fn, [Void, ImageType<Image3d, aQual>, VectorType<Int, 4>, VectorType<Half, 4>]>;
1417  }
1418}
1419
// write_imageh for "WO" images, and for "RW" images under the
// read-write-images extension.
1420defm : ImageWriteHalf<"WO">;
1421let Extension = FuncExtOpenCLCReadWriteImages in {
1422  defm : ImageWriteHalf<"RW">;
1423}
1424
1425
1426
1427//--------------------------------------------------------------------
1428// OpenCL v2.0 s6.13.15 - Work-group Functions
1429// --- Table 26 ---
// Work-group collective builtins; every record here is declared with
// Attr.Convergent and belongs to the work-group collective-functions extension.
1430let Extension = FuncExtOpenCLCWGCollectiveFunctions in {
      // Predicates over an Int.
1431  foreach fn = ["work_group_all", "work_group_any"] in {
1432    def : Builtin<fn, [Int, Int], Attr.Convergent>;
1433  }
      // Broadcast with one, two or three Size operands after the value.
1434  foreach fn = ["work_group_broadcast"] in {
1435    def : Builtin<fn, [IntLongFloatGenType1, IntLongFloatGenType1, Size], Attr.Convergent>;
1436    def : Builtin<fn, [IntLongFloatGenType1, IntLongFloatGenType1, Size, Size], Attr.Convergent>;
1437    def : Builtin<fn, [IntLongFloatGenType1, IntLongFloatGenType1, Size, Size, Size], Attr.Convergent>;
1438  }
      // Reductions and scans: name is <prefix><operation>.
1439  foreach operation = ["add", "min", "max"] in {
1440    foreach prefix = ["work_group_reduce_", "work_group_scan_exclusive_",
1441                    "work_group_scan_inclusive_"] in {
1442      def : Builtin<prefix # operation, [IntLongFloatGenType1, IntLongFloatGenType1], Attr.Convergent>;
1443    }
1444  }
1445}
1446
1447
1448//--------------------------------------------------------------------
1449// OpenCL2.0 : 6.13.16 : Pipe Functions
1450// --- Table 27 ---
1451// Defined in Builtins.td
1452
1453// --- Table 28 ---
1454// Builtins taking pipe arguments are defined in Builtins.td
// The only pipe-related builtin declared in this file; it takes a ReserveId
// rather than a pipe argument and is tied to the pipes extension.
1455let Extension = FuncExtOpenCLCPipes in {
1456  def : Builtin<"is_valid_reserve_id", [Bool, ReserveId]>;
1457}
1458
1459// --- Table 29 ---
1460// Defined in Builtins.td
1461
1462
1463//--------------------------------------------------------------------
1464// OpenCL2.0 : 6.13.17 : Enqueuing Kernels
1465// --- Table 30 ---
1466// Defined in Builtins.td
1467
1468// --- Table 32 ---
1469// Defined in Builtins.td
1470
1471// --- Table 33 ---
// Kernel-enqueue helper builtins, all tied to the device-enqueue extension.
1472let Extension = FuncExtOpenCLCDeviceEnqueue in {
      // Both event pointers are in the generic address space; the first one
      // points to const events.
1473  def : Builtin<"enqueue_marker",
1474      [Int, Queue, UInt, PointerType<ConstType<ClkEvent>, GenericAS>, PointerType<ClkEvent, GenericAS>]>;
1475
1476  // --- Table 34 ---
      // Event management builtins operating on ClkEvent.
1477  def : Builtin<"retain_event", [Void, ClkEvent]>;
1478  def : Builtin<"release_event", [Void, ClkEvent]>;
1479  def : Builtin<"create_user_event", [ClkEvent]>;
1480  def : Builtin<"is_valid_event", [Bool, ClkEvent]>;
1481  def : Builtin<"set_user_event_status", [Void, ClkEvent, Int]>;
      // The last operand is a void pointer in the global address space.
1482  def : Builtin<"capture_event_profiling_info",
1483      [Void, ClkEvent, ClkProfilingInfo, PointerType<Void, GlobalAS>]>;
1484
1485  // --- Table 35 ---
1486  def : Builtin<"get_default_queue", [Queue]>;
1487
      // ndrange_1D takes one to three Size values directly; ndrange_2D and
      // ndrange_3D take one to three pointers to const Size in the private
      // address space.
1488  def : Builtin<"ndrange_1D", [NDRange, Size]>;
1489  def : Builtin<"ndrange_1D", [NDRange, Size, Size]>;
1490  def : Builtin<"ndrange_1D", [NDRange, Size, Size, Size]>;
1491  def : Builtin<"ndrange_2D", [NDRange, PointerType<ConstType<Size>, PrivateAS>]>;
1492  def : Builtin<"ndrange_2D", [NDRange, PointerType<ConstType<Size>, PrivateAS>,
1493                                        PointerType<ConstType<Size>, PrivateAS>]>;
1494  def : Builtin<"ndrange_2D", [NDRange, PointerType<ConstType<Size>, PrivateAS>,
1495                                        PointerType<ConstType<Size>, PrivateAS>,
1496                                        PointerType<ConstType<Size>, PrivateAS>]>;
1497  def : Builtin<"ndrange_3D", [NDRange, PointerType<ConstType<Size>, PrivateAS>]>;
1498  def : Builtin<"ndrange_3D", [NDRange, PointerType<ConstType<Size>, PrivateAS>,
1499                                        PointerType<ConstType<Size>, PrivateAS>]>;
1500  def : Builtin<"ndrange_3D", [NDRange, PointerType<ConstType<Size>, PrivateAS>,
1501                                        PointerType<ConstType<Size>, PrivateAS>,
1502                                        PointerType<ConstType<Size>, PrivateAS>]>;
1503}
1504
1505
1506//--------------------------------------------------------------------
1507// End of the builtin functions defined in the OpenCL C specification.
1508// Builtin functions defined in the OpenCL C Extension are below.
1509//--------------------------------------------------------------------
1510
1511
1512// OpenCL Extension v2.0 s9.18 - Mipmaps
// Mipmap image reads with a Sampler, tied to the mipmap-image extension.
// Each image type gets two overloads per function: one whose signature ends
// in a single extra Float, and one that ends in two extra operands of equal
// type.  All coordinates are Float-based.
1513let Extension = FuncExtKhrMipmapImage in {
1514  // Additions to section 6.13.14.2.
1515  foreach access = ["RO"] in {
1516    foreach img = [Image2d] in {
1517      foreach fn = ["read_imagef"] in {
1518        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1519        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1520      }
1521      foreach fn = ["read_imagei"] in {
1522        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1523        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1524      }
1525      foreach fn = ["read_imageui"] in {
1526        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1527        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1528      }
1529    }
1530    foreach img = [Image2dDepth] in {
1531      foreach fn = ["read_imagef"] in {
1532        def : Builtin<fn, [Float, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1533        def : Builtin<fn, [Float, ImageType<img, access>, Sampler, VectorType<Float, 2>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1534      }
1535    }
1536    foreach img = [Image1d] in {
1537      foreach fn = ["read_imagef"] in {
1538        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, Float, Float], Attr.Pure>;
1539        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, Float, Float, Float], Attr.Pure>;
1540      }
1541      foreach fn = ["read_imagei"] in {
1542        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, Float, Float], Attr.Pure>;
1543        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, Float, Float, Float], Attr.Pure>;
1544      }
1545      foreach fn = ["read_imageui"] in {
1546        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, Float, Float], Attr.Pure>;
1547        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, Float, Float, Float], Attr.Pure>;
1548      }
1549    }
        // For Image3d the three-operand overload is listed first.
1550    foreach img = [Image3d] in {
1551      foreach fn = ["read_imagef"] in {
1552        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 4>, VectorType<Float, 4>], Attr.Pure>;
1553        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1554      }
1555      foreach fn = ["read_imagei"] in {
1556        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 4>, VectorType<Float, 4>], Attr.Pure>;
1557        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1558      }
1559      foreach fn = ["read_imageui"] in {
1560        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 4>, VectorType<Float, 4>], Attr.Pure>;
1561        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1562      }
1563    }
1564    foreach img = [Image1dArray] in {
1565      foreach fn = ["read_imagef"] in {
1566        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1567        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float, Float], Attr.Pure>;
1568      }
1569      foreach fn = ["read_imagei"] in {
1570        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1571        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float, Float], Attr.Pure>;
1572      }
1573      foreach fn = ["read_imageui"] in {
1574        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float], Attr.Pure>;
1575        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 2>, Float, Float], Attr.Pure>;
1576      }
1577    }
1578    foreach img = [Image2dArray] in {
1579      foreach fn = ["read_imagef"] in {
1580        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1581        def : Builtin<fn, [VectorType<Float, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1582      }
1583      foreach fn = ["read_imagei"] in {
1584        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1585        def : Builtin<fn, [VectorType<Int, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1586      }
1587      foreach fn = ["read_imageui"] in {
1588        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1589        def : Builtin<fn, [VectorType<UInt, 4>, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1590      }
1591    }
1592    foreach img = [Image2dArrayDepth] in {
1593      foreach fn = ["read_imagef"] in {
1594        def : Builtin<fn, [Float, ImageType<img, access>, Sampler, VectorType<Float, 4>, Float], Attr.Pure>;
1595        def : Builtin<fn, [Float, ImageType<img, access>, Sampler, VectorType<Float, 4>, VectorType<Float, 2>, VectorType<Float, 2>], Attr.Pure>;
1596      }
1597    }
1598  }
1599}
1600
1601// Added to section 6.13.14.5
// get_image_num_mip_levels for the access qualifier aQual, one overload per
// listed image type (Image1dBuffer is not in the list).
1602multiclass ImageQueryNumMipLevels<string aQual> {
1603  foreach img = [Image1d, Image2d, Image3d, Image1dArray, Image2dArray, Image2dDepth, Image2dArrayDepth] in {
1604    def : Builtin<"get_image_num_mip_levels", [Int, ImageType<img, aQual>]>;
1605  }
1606}
1607
// The mip-level query is instantiated for all three access qualifiers, all
// under the mipmap-image extension.
1608let Extension = FuncExtKhrMipmapImage in {
1609  defm : ImageQueryNumMipLevels<"RO">;
1610  defm : ImageQueryNumMipLevels<"WO">;
1611  defm : ImageQueryNumMipLevels<"RW">;
1612}
1613
1614// Write functions are enabled using a separate extension.
// Mipmap image writes for "WO" images.  Compared with the plain image
// writes, every signature has one extra Int operand between the coordinate
// and the value being written.
1615let Extension = FuncExtKhrMipmapImageWrites in {
1616  // Additions to section 6.13.14.4.
1617  foreach access = ["WO"] in {
1618    foreach img = [Image2d] in {
1619      def : Builtin<"write_imagef", [Void, ImageType<img, access>, VectorType<Int, 2>, Int, VectorType<Float, 4>]>;
1620      def : Builtin<"write_imagei", [Void, ImageType<img, access>, VectorType<Int, 2>, Int, VectorType<Int, 4>]>;
1621      def : Builtin<"write_imageui", [Void, ImageType<img, access>, VectorType<Int, 2>, Int, VectorType<UInt, 4>]>;
1622    }
1623    def : Builtin<"write_imagef", [Void, ImageType<Image2dDepth, access>, VectorType<Int, 2>, Int, Float]>;
1624    foreach img = [Image1d] in {
1625      def : Builtin<"write_imagef", [Void, ImageType<img, access>, Int, Int, VectorType<Float, 4>]>;
1626      def : Builtin<"write_imagei", [Void, ImageType<img, access>, Int, Int, VectorType<Int, 4>]>;
1627      def : Builtin<"write_imageui", [Void, ImageType<img, access>, Int, Int, VectorType<UInt, 4>]>;
1628    }
1629    foreach img = [Image1dArray] in {
1630      def : Builtin<"write_imagef", [Void, ImageType<img, access>, VectorType<Int, 2>, Int, VectorType<Float, 4>]>;
1631      def : Builtin<"write_imagei", [Void, ImageType<img, access>, VectorType<Int, 2>, Int, VectorType<Int, 4>]>;
1632      def : Builtin<"write_imageui", [Void, ImageType<img, access>, VectorType<Int, 2>, Int, VectorType<UInt, 4>]>;
1633    }
1634    foreach img = [Image2dArray] in {
1635      def : Builtin<"write_imagef", [Void, ImageType<img, access>, VectorType<Int, 4>, Int, VectorType<Float, 4>]>;
1636      def : Builtin<"write_imagei", [Void, ImageType<img, access>, VectorType<Int, 4>, Int, VectorType<Int, 4>]>;
1637      def : Builtin<"write_imageui", [Void, ImageType<img, access>, VectorType<Int, 4>, Int, VectorType<UInt, 4>]>;
1638    }
1639    def : Builtin<"write_imagef", [Void, ImageType<Image2dArrayDepth, access>, VectorType<Int, 4>, Int, Float]>;
1640    foreach img = [Image3d] in {
1641      def : Builtin<"write_imagef", [Void, ImageType<img, access>, VectorType<Int, 4>, Int, VectorType<Float, 4>]>;
1642      def : Builtin<"write_imagei", [Void, ImageType<img, access>, VectorType<Int, 4>, Int, VectorType<Int, 4>]>;
1643      def : Builtin<"write_imageui", [Void, ImageType<img, access>, VectorType<Int, 4>, Int, VectorType<UInt, 4>]>;
1644    }
1645  }
1646}
1647
1648//--------------------------------------------------------------------
1649// OpenCL Extension v2.0 s18.3 - Creating OpenCL Memory Objects from OpenGL MSAA Textures
1650// --- Table 6.13.14.3 ---
// MSAA image reads for the access qualifier aQual.  Every signature ends in
// an extra Int operand after the Int coordinate vector.
1651multiclass ImageReadMsaa<string aQual> {
1652  foreach img = [Image2dMsaa] in {
1653    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, aQual>, VectorType<Int, 2>, Int], Attr.Pure>;
1654    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, aQual>, VectorType<Int, 2>, Int], Attr.Pure>;
1655    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, aQual>, VectorType<Int, 2>, Int], Attr.Pure>;
1656  }
1657  foreach img = [Image2dArrayMsaa] in {
1658    def : Builtin<"read_imagef", [VectorType<Float, 4>, ImageType<img, aQual>, VectorType<Int, 4>, Int], Attr.Pure>;
1659    def : Builtin<"read_imagei", [VectorType<Int, 4>, ImageType<img, aQual>, VectorType<Int, 4>, Int], Attr.Pure>;
1660    def : Builtin<"read_imageui", [VectorType<UInt, 4>, ImageType<img, aQual>, VectorType<Int, 4>, Int], Attr.Pure>;
1661  }
      // MSAA depth images: read_imagef only, with a scalar Float leading the
      // signature.
1662  foreach fn = ["read_imagef"] in {
1663    def : Builtin<fn, [Float, ImageType<Image2dMsaaDepth, aQual>, VectorType<Int, 2>, Int], Attr.Pure>;
1664    def : Builtin<fn, [Float, ImageType<Image2dArrayMsaaDepth, aQual>, VectorType<Int, 4>, Int], Attr.Pure>;
1665  }
1666}
1667
1668// --- Table 6.13.14.5 ---
// Image queries on MSAA image types for the access qualifier aQual.
1669multiclass ImageQueryMsaa<string aQual> {
1670  foreach img = [Image2dMsaa, Image2dArrayMsaa, Image2dMsaaDepth, Image2dArrayMsaaDepth] in {
        // Int-valued queries, including the MSAA-specific sample count.
1671    foreach query = ["get_image_width", "get_image_height",
1672                    "get_image_channel_data_type", "get_image_channel_order",
1673                    "get_image_num_samples"] in {
1674      def : Builtin<query, [Int, ImageType<img, aQual>], Attr.Const>;
1675    }
        // get_image_dim is 2-component for all four MSAA image types.
1676    def : Builtin<"get_image_dim", [VectorType<Int, 2>, ImageType<img, aQual>], Attr.Const>;
1677  }
      // Array size: the array MSAA image types only.
1678  foreach img = [Image2dArrayMsaa, Image2dArrayMsaaDepth] in {
1679    def : Builtin<"get_image_array_size", [Size, ImageType<img, aQual>], Attr.Const>;
1680  }
1681}
1682
// MSAA builtins, all under the GL MSAA sharing extension.  Reads are
// instantiated for "RO" and "RW"; queries for "RO", "WO" and "RW".
1683let Extension = FuncExtKhrGlMsaaSharing in {
1684  defm : ImageReadMsaa<"RO">;
1685  defm : ImageQueryMsaa<"RO">;
1686  defm : ImageQueryMsaa<"WO">;
1687  defm : ImageReadMsaa<"RW">;
1688  defm : ImageQueryMsaa<"RW">;
1689}
1690
1691//--------------------------------------------------------------------
1692// OpenCL Extension v2.0 s28 - Subgroups
1693// --- Table 28.2.1 ---
// Argument-less sub-group queries; each signature is just [UInt].
1694let Extension = FuncExtKhrSubgroups in {
1695  foreach query = ["get_sub_group_size", "get_max_sub_group_size",
1696                  "get_num_sub_groups", "get_sub_group_id",
1697                  "get_sub_group_local_id"] in {
1698    def : Builtin<query, [UInt]>;
1699  }
      // This one additionally has MinVersion set to CL20.
1700  let MinVersion = CL20 in {
1701    foreach query = ["get_enqueued_num_sub_groups"] in {
1702      def : Builtin<query, [UInt]>;
1703    }
1704  }
1705}
1706
1707// --- Table 28.2.2 ---
// sub_group_barrier: the overload that also takes a MemoryScope has
// MinVersion set to CL20; the one-operand overload has no such restriction
// applied here.
1708let Extension = FuncExtKhrSubgroups in {
1709  def : Builtin<"sub_group_barrier", [Void, MemFenceFlags], Attr.Convergent>;
1710  let MinVersion = CL20 in {
1711    def : Builtin<"sub_group_barrier", [Void, MemFenceFlags, MemoryScope], Attr.Convergent>;
1712  }
1713}
1714
1715// --- Table 28.2.4 ---
// Sub-group collective builtins, all declared with Attr.Convergent.
1716let Extension = FuncExtKhrSubgroups in {
      // Predicates over an Int.
1717  foreach fn = ["sub_group_all", "sub_group_any"] in {
1718    def : Builtin<fn, [Int, Int], Attr.Convergent>;
1719  }
      // Broadcast: the operand after the value is a UInt.
1720  foreach fn = ["sub_group_broadcast"] in {
1721    def : Builtin<fn, [IntLongFloatGenType1, IntLongFloatGenType1, UInt], Attr.Convergent>;
1722  }
      // Reductions and scans: name is <prefix><operation>.
1723  foreach prefix = ["sub_group_reduce_", "sub_group_scan_exclusive_",
1724                  "sub_group_scan_inclusive_"] in {
1725    foreach operation = ["add", "min", "max"] in {
1726      def : Builtin<prefix # operation, [IntLongFloatGenType1, IntLongFloatGenType1], Attr.Convergent>;
1727    }
1728  }
1729}
1730
1731// OpenCL Extension v3.0 s38 - Extended Subgroup Functions
1732
1733// Section 38.4.1 - cl_khr_subgroup_extended_types
// Extra overloads of the sub-group collectives for additional operand types.
1734let Extension = FuncExtKhrSubgroupExtendedTypes in {
1735  // sub_group_broadcast gains scalar char, uchar, short, and ushort support.
1736  def : Builtin<"sub_group_broadcast", [CharShortGenType1, CharShortGenType1, UInt], Attr.Convergent>;
1737  // gentype may additionally be one of the supported built-in vector data types.
1738  def : Builtin<"sub_group_broadcast", [AGenTypeNNoScalar, AGenTypeNNoScalar, UInt], Attr.Convergent>;
1739
      // Reductions and scans gain the CharShortGenType1 overloads.
1740  foreach prefix = ["sub_group_reduce_", "sub_group_scan_exclusive_",
1741                  "sub_group_scan_inclusive_"] in {
1742    foreach operation = ["add", "min", "max"] in {
1743      def : Builtin<prefix # operation, [CharShortGenType1, CharShortGenType1], Attr.Convergent>;
1744    }
1745  }
1746}
1747
1748// Section 38.5.1 - cl_khr_subgroup_non_uniform_vote
// Non-uniform vote builtins.  All four list Int first in their signature;
// sub_group_non_uniform_all_equal takes an AGenType1 operand, the other
// predicates take an Int, and sub_group_elect takes no operand.
1749let Extension = FuncExtKhrSubgroupNonUniformVote in {
1750  def : Builtin<"sub_group_elect", [Int]>;
1751  def : Builtin<"sub_group_non_uniform_all", [Int, Int]>;
1752  def : Builtin<"sub_group_non_uniform_any", [Int, Int]>;
1753  def : Builtin<"sub_group_non_uniform_all_equal", [Int, AGenType1]>;
1754}
1755
1756// Section 38.6.1 - cl_khr_subgroup_ballot
// Ballot builtins.  Ballot values are represented as VectorType<UInt, 4>.
1757let Extension = FuncExtKhrSubgroupBallot in {
1758  def : Builtin<"sub_group_non_uniform_broadcast", [AGenTypeN, AGenTypeN, UInt]>;
1759  def : Builtin<"sub_group_broadcast_first", [AGenType1, AGenType1]>;
1760  def : Builtin<"sub_group_ballot", [VectorType<UInt, 4>, Int]>;
      // The next three are the only ballot consumers declared with Attr.Const.
1761  def : Builtin<"sub_group_inverse_ballot", [Int, VectorType<UInt, 4>], Attr.Const>;
1762  def : Builtin<"sub_group_ballot_bit_extract", [Int, VectorType<UInt, 4>, UInt], Attr.Const>;
1763  def : Builtin<"sub_group_ballot_bit_count", [UInt, VectorType<UInt, 4>], Attr.Const>;
1764  def : Builtin<"sub_group_ballot_inclusive_scan", [UInt, VectorType<UInt, 4>]>;
1765  def : Builtin<"sub_group_ballot_exclusive_scan", [UInt, VectorType<UInt, 4>]>;
1766  def : Builtin<"sub_group_ballot_find_lsb", [UInt, VectorType<UInt, 4>]>;
1767  def : Builtin<"sub_group_ballot_find_msb", [UInt, VectorType<UInt, 4>]>;
1768
      // get_sub_group_<cmp>_mask for each comparison suffix.
1769  foreach cmp = ["eq", "ge", "gt", "le", "lt"] in {
1770    def : Builtin<"get_sub_group_" # cmp # "_mask", [VectorType<UInt, 4>], Attr.Const>;
1771  }
1772}
1773
// Section 38.7.1 - cl_khr_subgroup_non_uniform_arithmetic
// For each of reduce / exclusive scan / inclusive scan, declare three
// families of sub_group_non_uniform_* builtins:
//   - add, min, max, mul over AGenType1,
//   - and, or, xor over AIGenType1,
//   - logical_and, logical_or, logical_xor over Int.
let Extension = FuncExtKhrSubgroupNonUniformArithmetic in {
  foreach kind = ["reduce_", "scan_exclusive_", "scan_inclusive_"] in {
    foreach arith = ["add", "min", "max", "mul"] in
      def : Builtin<!strconcat("sub_group_non_uniform_", kind, arith), [AGenType1, AGenType1]>;

    foreach bitop = ["and", "or", "xor"] in
      def : Builtin<!strconcat("sub_group_non_uniform_", kind, bitop), [AIGenType1, AIGenType1]>;

    foreach logop = ["and", "or", "xor"] in
      def : Builtin<!strconcat("sub_group_non_uniform_", kind, "logical_", logop), [Int, Int]>;
  }
}
1788
// Section 38.8.1 - cl_khr_subgroup_shuffle
// Both shuffles take a value (AGenType1) plus a UInt and return the value
// type; they require FuncExtKhrSubgroupShuffle.
let Extension = FuncExtKhrSubgroupShuffle in {
  foreach fn = ["sub_group_shuffle", "sub_group_shuffle_xor"] in {
    def : Builtin<fn, [AGenType1, AGenType1, UInt]>;
  }
}
1794
// Section 38.9.1 - cl_khr_subgroup_shuffle_relative
// The up/down shuffles share one signature: a value (AGenType1) plus a UInt,
// returning the value type.  They require FuncExtKhrSubgroupShuffleRelative.
let Extension = FuncExtKhrSubgroupShuffleRelative in {
  foreach direction = ["up", "down"] in {
    def : Builtin<"sub_group_shuffle_" # direction, [AGenType1, AGenType1, UInt]>;
  }
}
1800
// Section 38.10.1 - cl_khr_subgroup_clustered_reduce
// Clustered reductions; every overload takes a trailing UInt argument after
// the value being reduced:
//   - add, min, max, mul over AGenType1,
//   - and, or, xor over AIGenType1,
//   - logical_and, logical_or, logical_xor over Int.
let Extension = FuncExtKhrSubgroupClusteredReduce in {
  foreach arith = ["add", "min", "max", "mul"] in
    def : Builtin<!strconcat("sub_group_clustered_reduce_", arith), [AGenType1, AGenType1, UInt]>;

  foreach bitop = ["and", "or", "xor"] in
    def : Builtin<!strconcat("sub_group_clustered_reduce_", bitop), [AIGenType1, AIGenType1, UInt]>;

  foreach logop = ["and", "or", "xor"] in
    def : Builtin<!strconcat("sub_group_clustered_reduce_logical_", logop), [Int, Int, UInt]>;
}
1813
// Section 40.3.1 - cl_khr_extended_bit_ops
// Bit-manipulation builtins; all are Attr.Const and require
// FuncExtKhrExtendedBitOps.
let Extension = FuncExtKhrExtendedBitOps in {
  def : Builtin<"bitfield_insert", [AIGenTypeN, AIGenTypeN, AIGenTypeN, UInt, UInt], Attr.Const>;

  // The extract builtins fix the return type by name (signed -> SGenTypeN,
  // unsigned -> UGenTypeN) and accept either SGenTypeN or UGenTypeN as the
  // source operand.
  foreach Src = [SGenTypeN, UGenTypeN] in {
    def : Builtin<"bitfield_extract_signed", [SGenTypeN, Src, UInt, UInt], Attr.Const>;
  }
  foreach Src = [SGenTypeN, UGenTypeN] in {
    def : Builtin<"bitfield_extract_unsigned", [UGenTypeN, Src, UInt, UInt], Attr.Const>;
  }

  def : Builtin<"bit_reverse", [AIGenTypeN, AIGenTypeN], Attr.Const>;
}
1823
// Section 42.3 - cl_khr_integer_dot_product
// Dot products over 4-element char/uchar vectors.  The result is UInt only
// when both operands are uchar vectors; every other combination yields Int.

// Plain dot product.
let Extension = FunctionExtension<"__opencl_c_integer_dot_product_input_4x8bit"> in {
  def : Builtin<"dot", [UInt, VectorType<UChar, 4>, VectorType<UChar, 4>], Attr.Const>;
  def : Builtin<"dot", [Int, VectorType<Char, 4>, VectorType<Char, 4>], Attr.Const>;
  def : Builtin<"dot", [Int, VectorType<UChar, 4>, VectorType<Char, 4>], Attr.Const>;
  def : Builtin<"dot", [Int, VectorType<Char, 4>, VectorType<UChar, 4>], Attr.Const>;
}

// dot_acc_sat: same operand combinations, with a trailing accumulator
// argument whose type matches the return type.
let Extension = FunctionExtension<"__opencl_c_integer_dot_product_input_4x8bit"> in {
  def : Builtin<"dot_acc_sat", [UInt, VectorType<UChar, 4>, VectorType<UChar, 4>, UInt], Attr.Const>;
  def : Builtin<"dot_acc_sat", [Int, VectorType<Char, 4>, VectorType<Char, 4>, Int], Attr.Const>;
  def : Builtin<"dot_acc_sat", [Int, VectorType<UChar, 4>, VectorType<Char, 4>, Int], Attr.Const>;
  def : Builtin<"dot_acc_sat", [Int, VectorType<Char, 4>, VectorType<UChar, 4>, Int], Attr.Const>;
}
1836
// Packed 4x8-bit dot products: both operands are passed as UInt.  The "uu"
// variant returns UInt; the "ss", "us" and "su" variants return Int.  All are
// Attr.Const.
let Extension = FunctionExtension<"__opencl_c_integer_dot_product_input_4x8bit_packed"> in {
  def : Builtin<"dot_4x8packed_uu_uint", [UInt, UInt, UInt], Attr.Const>;
  foreach sign = ["ss", "us", "su"] in {
    def : Builtin<"dot_4x8packed_" # sign # "_int", [Int, UInt, UInt], Attr.Const>;
  }

  // Accumulating forms: a trailing accumulator argument whose type matches
  // the return type.
  def : Builtin<"dot_acc_sat_4x8packed_uu_uint", [UInt, UInt, UInt, UInt], Attr.Const>;
  foreach sign = ["ss", "us", "su"] in {
    def : Builtin<"dot_acc_sat_4x8packed_" # sign # "_int", [Int, UInt, UInt, Int], Attr.Const>;
  }
}
1848
// Section 48.3 - cl_khr_subgroup_rotate
// Both rotate builtins are Attr.Convergent and gated on the
// "cl_khr_subgroup_rotate" extension.

// sub_group_rotate: value (AGenType1) plus an Int argument.
let Extension = FunctionExtension<"cl_khr_subgroup_rotate"> in
  def : Builtin<"sub_group_rotate", [AGenType1, AGenType1, Int], Attr.Convergent>;

// sub_group_clustered_rotate: as above, with an additional trailing UInt.
let Extension = FunctionExtension<"cl_khr_subgroup_rotate"> in
  def : Builtin<"sub_group_clustered_rotate", [AGenType1, AGenType1, Int, UInt], Attr.Convergent>;
1854
// cl_khr_kernel_clock
// One pair of builtins per clock scope (device, work_group, sub_group):
//   clock_read_<scope>       returns ULong
//   clock_read_hilo_<scope>  returns VectorType<UInt, 2>
// Each pair is gated on "cl_khr_kernel_clock" together with the matching
// "__opencl_c_kernel_clock_scope_<scope>" name.
foreach scope = ["device", "work_group", "sub_group"] in {
  let Extension = FunctionExtension<"cl_khr_kernel_clock __opencl_c_kernel_clock_scope_" # scope> in {
    def : Builtin<"clock_read_" # scope, [ULong]>;
    def : Builtin<"clock_read_hilo_" # scope, [VectorType<UInt, 2>]>;
  }
}
1868
1869//--------------------------------------------------------------------
1870// Arm extensions.
// arm_dot: 8-bit dot product over 4-element vectors, in an unsigned
// (uchar -> UInt) and a signed (char -> Int) overload.
let Extension = ArmIntegerDotProductInt8 in {
  def : Builtin<"arm_dot", [UInt, VectorType<UChar, 4>, VectorType<UChar, 4>]>;
  def : Builtin<"arm_dot", [Int, VectorType<Char, 4>, VectorType<Char, 4>]>;
}
// arm_dot_acc on 4-element 8-bit vectors: the trailing accumulator argument
// has the same type as the result (UInt for uchar, Int for char).
let Extension = ArmIntegerDotProductAccumulateInt8 in {
  def : Builtin<"arm_dot_acc", [UInt, VectorType<UChar, 4>, VectorType<UChar, 4>, UInt]>;
  def : Builtin<"arm_dot_acc", [Int, VectorType<Char, 4>, VectorType<Char, 4>, Int]>;
}
// arm_dot_acc on 2-element 16-bit vectors: the trailing accumulator argument
// has the same type as the result (UInt for ushort, Int for short).
let Extension = ArmIntegerDotProductAccumulateInt16 in {
  def : Builtin<"arm_dot_acc", [UInt, VectorType<UShort, 2>, VectorType<UShort, 2>, UInt]>;
  def : Builtin<"arm_dot_acc", [Int, VectorType<Short, 2>, VectorType<Short, 2>, Int]>;
}
// arm_dot_acc_sat on 4-element 8-bit vectors: the trailing accumulator
// argument has the same type as the result (UInt for uchar, Int for char).
let Extension = ArmIntegerDotProductAccumulateSaturateInt8 in {
  def : Builtin<"arm_dot_acc_sat", [UInt, VectorType<UChar, 4>, VectorType<UChar, 4>, UInt]>;
  def : Builtin<"arm_dot_acc_sat", [Int, VectorType<Char, 4>, VectorType<Char, 4>, Int]>;
}
1895