xref: /freebsd/contrib/llvm-project/clang/lib/CodeGen/CGOpenMPRuntime.h (revision 5e801ac66d24704442eba426ed13c3effb8a34e7)
1 //===----- CGOpenMPRuntime.h - Interface to OpenMP Runtimes -----*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This provides a class for OpenMP runtime code generation.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #ifndef LLVM_CLANG_LIB_CODEGEN_CGOPENMPRUNTIME_H
14 #define LLVM_CLANG_LIB_CODEGEN_CGOPENMPRUNTIME_H
15 
16 #include "CGValue.h"
17 #include "clang/AST/DeclOpenMP.h"
18 #include "clang/AST/GlobalDecl.h"
19 #include "clang/AST/Type.h"
20 #include "clang/Basic/OpenMPKinds.h"
21 #include "clang/Basic/SourceLocation.h"
22 #include "llvm/ADT/DenseMap.h"
23 #include "llvm/ADT/PointerIntPair.h"
24 #include "llvm/ADT/SmallPtrSet.h"
25 #include "llvm/ADT/StringMap.h"
26 #include "llvm/ADT/StringSet.h"
27 #include "llvm/Frontend/OpenMP/OMPConstants.h"
28 #include "llvm/Frontend/OpenMP/OMPIRBuilder.h"
29 #include "llvm/IR/Function.h"
30 #include "llvm/IR/ValueHandle.h"
31 #include "llvm/Support/AtomicOrdering.h"
32 
33 namespace llvm {
34 class ArrayType;
35 class Constant;
36 class FunctionType;
37 class GlobalVariable;
38 class StructType;
39 class Type;
40 class Value;
41 class OpenMPIRBuilder;
42 } // namespace llvm
43 
44 namespace clang {
45 class Expr;
46 class OMPDependClause;
47 class OMPExecutableDirective;
48 class OMPLoopDirective;
49 class VarDecl;
50 class OMPDeclareReductionDecl;
51 class IdentifierInfo;
52 
53 namespace CodeGen {
54 class Address;
55 class CodeGenFunction;
56 class CodeGenModule;
57 
58 /// Base class for a pair of pre/post actions attached to the advanced codegen
59 /// sequence of an OpenMP region. Both hooks have empty default bodies.
60 class PrePostActionTy {
61 public:
62   explicit PrePostActionTy() {}
     /// Pre-action hook; does nothing unless overridden. Presumably run before
     /// the region body is emitted -- the call site is outside this header.
63   virtual void Enter(CodeGenFunction &CGF) {}
     /// Post-action hook; does nothing unless overridden. Presumably run after
     /// the region body is emitted -- the call site is outside this header.
64   virtual void Exit(CodeGenFunction &CGF) {}
     /// Virtual so that derived actions can be destroyed through this base type.
65   virtual ~PrePostActionTy() {}
66 };
67 
68 /// Non-owning, type-erased handle to a callable that emits the code of an
69 /// OpenMP region, optionally paired with a pre|post-action (see setAction()).
   ///
   /// Only the address of the callable is stored, so the callable has to outlive
   /// every use of this handle.
70 class RegionCodeGenTy final {
     /// Address of the wrapped callable, stored as an integer to erase its type.
71   intptr_t CodeGen;
72   typedef void (*CodeGenTy)(intptr_t, CodeGenFunction &, PrePostActionTy &);
     /// CallbackFn instantiation matching the real type behind CodeGen.
73   CodeGenTy Callback;
     /// Action attached by setAction(), or nullptr. Mutable because setAction()
     /// is a const member.
74   mutable PrePostActionTy *PrePostAction;
75   RegionCodeGenTy() = delete;
     /// Trampoline: reinterprets \p CodeGen as a pointer to \c Callable and calls
     /// that object with \p CGF and \p Action.
76   template <typename Callable>
77   static void CallbackFn(intptr_t CodeGen, CodeGenFunction &CGF,
78                          PrePostActionTy &Action) {
79     return (*reinterpret_cast<Callable *>(CodeGen))(CGF, Action);
80   }
81 
82 public:
     /// Wraps \p CodeGen by recording its address and the matching trampoline;
     /// no action is attached yet. The unnamed enable_if parameter removes this
     /// overload when \c Callable, with its reference stripped, is
     /// RegionCodeGenTy itself.
83   template <typename Callable>
84   RegionCodeGenTy(
85       Callable &&CodeGen,
86       std::enable_if_t<!std::is_same<std::remove_reference_t<Callable>,
87                                      RegionCodeGenTy>::value> * = nullptr)
88       : CodeGen(reinterpret_cast<intptr_t>(&CodeGen)),
89         Callback(CallbackFn<std::remove_reference_t<Callable>>),
90         PrePostAction(nullptr) {}
     /// Attaches \p Action by storing its address; \p Action is not copied.
91   void setAction(PrePostActionTy &Action) const { PrePostAction = &Action; }
     /// Runs the wrapped callable for \p CGF. Defined out of line; how the
     /// attached action takes part is decided there.
92   void operator()(CodeGenFunction &CGF) const;
93 };
94 
95 struct OMPTaskDataTy final {
     // Plain data holder; it declares no member functions of its own.
     // NOTE(review): going by the field names this carries clause information
     // for task-generating directives; producers and consumers are outside this
     // header -- confirm there.
96   SmallVector<const Expr *, 4> PrivateVars;
97   SmallVector<const Expr *, 4> PrivateCopies;
98   SmallVector<const Expr *, 4> FirstprivateVars;
99   SmallVector<const Expr *, 4> FirstprivateCopies;
100   SmallVector<const Expr *, 4> FirstprivateInits;
101   SmallVector<const Expr *, 4> LastprivateVars;
102   SmallVector<const Expr *, 4> LastprivateCopies;
103   SmallVector<const Expr *, 4> ReductionVars;
104   SmallVector<const Expr *, 4> ReductionOrigs;
105   SmallVector<const Expr *, 4> ReductionCopies;
106   SmallVector<const Expr *, 4> ReductionOps;
107   SmallVector<CanonicalDeclPtr<const VarDecl>, 4> PrivateLocals;
      /// One dependence entry: its kind, an optional iterator expression and
      /// the expressions it applies to. A default-constructed entry has an
      /// unknown kind, no iterator and an empty expression list.
108   struct DependData {
109     OpenMPDependClauseKind DepKind = OMPC_DEPEND_unknown;
110     const Expr *IteratorExpr = nullptr;
111     SmallVector<const Expr *, 4> DepExprs;
112     explicit DependData() = default;
113     DependData(OpenMPDependClauseKind DepKind, const Expr *IteratorExpr)
114         : DepKind(DepKind), IteratorExpr(IteratorExpr) {}
115   };
116   SmallVector<DependData, 4> Dependences;
      // Each of the next three pairs an llvm::Value pointer with a one-bit
      // bool; how the bit is interpreted is up to the users of this struct.
117   llvm::PointerIntPair<llvm::Value *, 1, bool> Final;
118   llvm::PointerIntPair<llvm::Value *, 1, bool> Schedule;
119   llvm::PointerIntPair<llvm::Value *, 1, bool> Priority;
      // Defaults below: no reductions value, zero parts, tied, all other flags
      // off.
120   llvm::Value *Reductions = nullptr;
121   unsigned NumberOfParts = 0;
122   bool Tied = true;
123   bool Nogroup = false;
124   bool IsReductionWithTaskMod = false;
125   bool IsWorksharingReduction = false;
126 };
127 
128 /// Class intended to support codegen of all kinds of reduction clauses.
129 class ReductionCodeGen {
130 private:
131   /// Data required for codegen of reduction clauses.
132   struct ReductionData {
133     /// Reference to the item shared between tasks to reduce into.
134     const Expr *Shared = nullptr;
135     /// Reference to the original item.
136     const Expr *Ref = nullptr;
137     /// Helper expression for generation of private copy.
138     const Expr *Private = nullptr;
139     /// Helper expression for generation reduction operation.
140     const Expr *ReductionOp = nullptr;
141     ReductionData(const Expr *Shared, const Expr *Ref, const Expr *Private,
142                   const Expr *ReductionOp)
143         : Shared(Shared), Ref(Ref), Private(Private), ReductionOp(ReductionOp) {
144     }
145   };
146   /// List of reduction-based clauses.
147   SmallVector<ReductionData, 4> ClausesData;
148 
149   /// List of addresses of shared variables/expressions.
      /// Only the first element of each pair is exposed, via getSharedLValue().
150   SmallVector<std::pair<LValue, LValue>, 4> SharedAddresses;
151   /// List of addresses of original variables/expressions.
      /// Only the first element of each pair is exposed, via getOrigLValue().
152   SmallVector<std::pair<LValue, LValue>, 4> OrigAddresses;
153   /// Sizes of the reduction items in chars.
154   SmallVector<std::pair<llvm::Value *, llvm::Value *>, 4> Sizes;
155   /// Base declarations for the reduction items.
156   SmallVector<const VarDecl *, 4> BaseDecls;
157 
158   /// Emits lvalue for shared expression.
159   LValue emitSharedLValue(CodeGenFunction &CGF, const Expr *E);
160   /// Emits upper bound for shared expression (if array section).
161   LValue emitSharedLValueUB(CodeGenFunction &CGF, const Expr *E);
162   /// Performs aggregate initialization.
163   /// \param N Number of reduction item in the common list.
164   /// \param PrivateAddr Address of the corresponding private item.
165   /// \param SharedLVal Address of the original shared variable.
166   /// \param DRD Declare reduction construct used for reduction item.
167   void emitAggregateInitialization(CodeGenFunction &CGF, unsigned N,
168                                    Address PrivateAddr, LValue SharedLVal,
169                                    const OMPDeclareReductionDecl *DRD);
170 
171 public:
      /// Builds the helper from four parallel lists of expressions, one entry
      /// per reduction item. Defined out of line.
172   ReductionCodeGen(ArrayRef<const Expr *> Shareds, ArrayRef<const Expr *> Origs,
173                    ArrayRef<const Expr *> Privates,
174                    ArrayRef<const Expr *> ReductionOps);
175   /// Emits lvalue for the shared and original reduction item.
176   /// \param N Number of the reduction item.
177   void emitSharedOrigLValue(CodeGenFunction &CGF, unsigned N);
178   /// Emits the code for the variable-modified type, if required.
179   /// \param N Number of the reduction item.
180   void emitAggregateType(CodeGenFunction &CGF, unsigned N);
181   /// Emits the code for the variable-modified type, if required.
182   /// \param N Number of the reduction item.
183   /// \param Size Size of the type in chars.
184   void emitAggregateType(CodeGenFunction &CGF, unsigned N, llvm::Value *Size);
185   /// Performs initialization of the private copy for the reduction item.
186   /// \param N Number of the reduction item.
187   /// \param PrivateAddr Address of the corresponding private item.
188   /// \param DefaultInit Default initialization sequence that should be
189   /// performed if no reduction specific initialization is found.
190   /// \param SharedLVal Address of the original shared variable.
191   void
192   emitInitialization(CodeGenFunction &CGF, unsigned N, Address PrivateAddr,
193                      LValue SharedLVal,
194                      llvm::function_ref<bool(CodeGenFunction &)> DefaultInit);
195   /// Returns true if the private copy requires cleanups.
      /// \param N Number of the reduction item.
196   bool needCleanups(unsigned N);
197   /// Emits cleanup code for the reduction item.
198   /// \param N Number of the reduction item.
199   /// \param PrivateAddr Address of the corresponding private item.
200   void emitCleanups(CodeGenFunction &CGF, unsigned N, Address PrivateAddr);
201   /// Adjusts \p PrivateAddr for using instead of the original variable
202   /// address in normal operations.
203   /// \param N Number of the reduction item.
204   /// \param PrivateAddr Address of the corresponding private item.
205   Address adjustPrivateAddress(CodeGenFunction &CGF, unsigned N,
206                                Address PrivateAddr);
207   /// Returns LValue for the shared reduction item.
208   LValue getSharedLValue(unsigned N) const { return SharedAddresses[N].first; }
209   /// Returns LValue for the original reduction item.
210   LValue getOrigLValue(unsigned N) const { return OrigAddresses[N].first; }
211   /// Returns the size of the reduction item (in chars and total number of
212   /// elements in the item), or nullptr, if the size is a constant.
213   std::pair<llvm::Value *, llvm::Value *> getSizes(unsigned N) const {
214     return Sizes[N];
215   }
216   /// Returns the base declaration of the reduction item.
217   const VarDecl *getBaseDecl(unsigned N) const { return BaseDecls[N]; }
218   /// Returns the expression referencing the original reduction item.
219   const Expr *getRefExpr(unsigned N) const { return ClausesData[N].Ref; }
220   /// Returns true if the initialization of the reduction item uses initializer
221   /// from declare reduction construct.
222   bool usesReductionInitializer(unsigned N) const;
223 };
224 
225 class CGOpenMPRuntime {
226 public:
227   /// Allows to disable automatic handling of functions used in target regions
228   /// as those marked as `omp declare target`.
      /// Constructor and destructor are defined out of line.
229   class DisableAutoDeclareTargetRAII {
230     CodeGenModule &CGM;
        /// NOTE(review): presumably the setting in effect before construction,
        /// put back by the destructor -- confirm in the implementation file.
231     bool SavedShouldMarkAsGlobal;
232 
233   public:
234     DisableAutoDeclareTargetRAII(CodeGenModule &CGM);
235     ~DisableAutoDeclareTargetRAII();
236   };
237 
238   /// Manages list of nontemporal decls for the specified directive.
      /// Constructor and destructor are defined out of line.
239   class NontemporalDeclsRAII {
240     CodeGenModule &CGM;
        /// Fixed at construction. NOTE(review): presumably tells the destructor
        /// whether the constructor pushed anything -- confirm in the
        /// implementation file.
241     const bool NeedToPush;
242 
243   public:
244     NontemporalDeclsRAII(CodeGenModule &CGM, const OMPLoopDirective &S);
245     ~NontemporalDeclsRAII();
246   };
247 
248   /// Manages list of local decls of untied tasks.
      /// Constructor and destructor are defined out of line.
249   class UntiedTaskLocalDeclsRAII {
250     CodeGenModule &CGM;
        /// Fixed at construction. NOTE(review): presumably tells the destructor
        /// whether the constructor pushed anything -- confirm in the
        /// implementation file.
251     const bool NeedToPush;
252 
253   public:
        /// \param LocalVars Map from each local variable to a pair of addresses;
        /// the role of each address is defined by the implementation.
254     UntiedTaskLocalDeclsRAII(
255         CodeGenFunction &CGF,
256         const llvm::MapVector<CanonicalDeclPtr<const VarDecl>,
257                               std::pair<Address, Address>> &LocalVars);
258     ~UntiedTaskLocalDeclsRAII();
259   };
260 
261   /// Maps the expression for the lastprivate variable to the global copy used
262   /// to store new value because original variables are not mapped in inner
263   /// parallel regions. Only private copies are captured but we need also to
264   /// store private copy in shared address.
265   /// Also, stores the expression for the private loop counter and its
266   /// threadprivate name.
267   struct LastprivateConditionalData {
        /// Declaration -> unique name, kept in insertion order (MapVector).
268     llvm::MapVector<CanonicalDeclPtr<const Decl>, SmallString<16>>
269         DeclToUniqueName;
270     LValue IVLVal;
271     llvm::Function *Fn = nullptr;
272     bool Disabled = false;
273   };
274   /// Manages list of lastprivate conditional decls for the specified directive.
275   class LastprivateConditionalRAII {
        /// The step this object took on construction.
276     enum class ActionToDo {
277       DoNotPush,
278       PushAsLastprivateConditional,
279       DisableLastprivateConditional,
280     };
281     CodeGenModule &CGM;
        /// Defaults to DoNotPush. NOTE(review): presumably read by the
        /// destructor to undo the matching step -- confirm in the
        /// implementation file.
282     ActionToDo Action = ActionToDo::DoNotPush;
283 
284     /// Check and try to disable analysis of inner regions for changes in
285     /// lastprivate conditional.
286     void tryToDisableInnerAnalysis(const OMPExecutableDirective &S,
287                                    llvm::DenseSet<CanonicalDeclPtr<const Decl>>
288                                        &NeedToAddForLPCsAsDisabled) const;
289 
        /// Private overload without an IV lvalue; not callable from outside the
        /// class. NOTE(review): presumably the one disable() goes through.
290     LastprivateConditionalRAII(CodeGenFunction &CGF,
291                                const OMPExecutableDirective &S);
292 
293   public:
294     explicit LastprivateConditionalRAII(CodeGenFunction &CGF,
295                                         const OMPExecutableDirective &S,
296                                         LValue IVLVal);
        /// Factory returning an RAII object by value for directive \p S; see
        /// ActionToDo::DisableLastprivateConditional.
297     static LastprivateConditionalRAII disable(CodeGenFunction &CGF,
298                                               const OMPExecutableDirective &S);
299     ~LastprivateConditionalRAII();
300   };
301 
      /// Returns a reference to the OpenMPIRBuilder member held by this object.
302   llvm::OpenMPIRBuilder &getOMPBuilder() { return OMPBuilder; }
303 
304 protected:
305   CodeGenModule &CGM;
306   StringRef FirstSeparator, Separator;
307 
308   /// An OpenMP-IR-Builder instance.
309   llvm::OpenMPIRBuilder OMPBuilder;
310 
311   /// Constructor allowing to redefine the name separator for the variables.
312   explicit CGOpenMPRuntime(CodeGenModule &CGM, StringRef FirstSeparator,
313                            StringRef Separator);
314 
315   /// Creates offloading entry for the provided entry ID \a ID,
316   /// address \a Addr, size \a Size, and flags \a Flags.
317   virtual void createOffloadEntry(llvm::Constant *ID, llvm::Constant *Addr,
318                                   uint64_t Size, int32_t Flags,
319                                   llvm::GlobalValue::LinkageTypes Linkage);
320 
321   /// Helper to emit outlined function for 'target' directive.
322   /// \param D Directive to emit.
323   /// \param ParentName Name of the function that encloses the target region.
324   /// \param OutlinedFn Outlined function value to be defined by this call.
325   /// \param OutlinedFnID Outlined function ID value to be defined by this call.
326   /// \param IsOffloadEntry True if the outlined function is an offload entry.
327   /// \param CodeGen Lambda codegen specific to an accelerator device.
328   /// An outlined function may not be an entry if, e.g. the if clause always
329   /// evaluates to false.
330   virtual void emitTargetOutlinedFunctionHelper(const OMPExecutableDirective &D,
331                                                 StringRef ParentName,
332                                                 llvm::Function *&OutlinedFn,
333                                                 llvm::Constant *&OutlinedFnID,
334                                                 bool IsOffloadEntry,
335                                                 const RegionCodeGenTy &CodeGen);
336 
337   /// Emits object of ident_t type with info for source location.
338   /// \param Flags Flags for OpenMP location.
339   ///
340   llvm::Value *emitUpdateLocation(CodeGenFunction &CGF, SourceLocation Loc,
341                                   unsigned Flags = 0);
342 
343   /// Emit the number of teams for a target directive.  Inspect the num_teams
344   /// clause associated with a teams construct combined or closely nested
345   /// with the target directive.
346   ///
347   /// Emit a team of size one for directives such as 'target parallel' that
348   /// have no associated teams construct.
349   ///
350   /// Otherwise, return nullptr.
351   const Expr *getNumTeamsExprForTargetDirective(CodeGenFunction &CGF,
352                                                 const OMPExecutableDirective &D,
353                                                 int32_t &DefaultVal);
354   llvm::Value *emitNumTeamsForTargetDirective(CodeGenFunction &CGF,
355                                               const OMPExecutableDirective &D);
356   /// Emit the number of threads for a target directive.  Inspect the
357   /// thread_limit clause associated with a teams construct combined or closely
358   /// nested with the target directive.
359   ///
360   /// Emit the num_threads clause for directives such as 'target parallel' that
361   /// have no associated teams construct.
362   ///
363   /// Otherwise, return nullptr.
364   const Expr *
365   getNumThreadsExprForTargetDirective(CodeGenFunction &CGF,
366                                       const OMPExecutableDirective &D,
367                                       int32_t &DefaultVal);
368   llvm::Value *
369   emitNumThreadsForTargetDirective(CodeGenFunction &CGF,
370                                    const OMPExecutableDirective &D);
371 
372   /// Returns pointer to ident_t type.
373   llvm::Type *getIdentTyPointerTy();
374 
375   /// Gets thread id value for the current thread.
376   ///
377   llvm::Value *getThreadID(CodeGenFunction &CGF, SourceLocation Loc);
378 
379   /// Get the function name of an outlined region.
380   /// The name can be customized depending on the target: the method is
381   /// virtual, and this base version returns ".omp_outlined.".
382   virtual StringRef getOutlinedHelperName() const { return ".omp_outlined."; }
383 
384   /// Emits \p Callee function call with arguments \p Args with location \p Loc.
385   void emitCall(CodeGenFunction &CGF, SourceLocation Loc,
386                 llvm::FunctionCallee Callee,
387                 ArrayRef<llvm::Value *> Args = llvm::None) const;
388 
389   /// Emits address of the word in a memory where current thread id is
390   /// stored.
391   virtual Address emitThreadIDAddress(CodeGenFunction &CGF, SourceLocation Loc);
392 
393   void setLocThreadIdInsertPt(CodeGenFunction &CGF,
394                               bool AtCurrentPoint = false);
395   void clearLocThreadIdInsertPt(CodeGenFunction &CGF);
396 
397   /// Check if the default location must be constant.
398   /// Default is false to support OMPT/OMPD; virtual, so it can be overridden.
399   virtual bool isDefaultLocationConstant() const { return false; }
400 
401   /// Returns additional flags that can be stored in reserved_2 field of the
402   /// default location. This base version contributes none (returns 0).
403   virtual unsigned getDefaultLocationReserved2Flags() const { return 0; }
404 
405   /// Returns default flags for the barriers depending on the directive, for
406   /// which this barrier is going to be emitted.
407   static unsigned getDefaultFlagsForBarriers(OpenMPDirectiveKind Kind);
408 
409   /// Get the LLVM type for the critical name. Plain accessor: it returns the
      /// KmpCriticalNameTy member as is and creates nothing.
410   llvm::ArrayType *getKmpCriticalNameTy() const {return KmpCriticalNameTy;}
411 
412   /// Returns corresponding lock object for the specified critical region
413   /// name. If the lock object does not exist it is created, otherwise the
414   /// reference to the existing copy is returned.
415   /// \param CriticalName Name of the critical region.
416   ///
417   llvm::Value *getCriticalRegionLock(StringRef CriticalName);
418 
419 private:
420 
421   /// Map for SourceLocation and OpenMP runtime library debug locations.
422   typedef llvm::DenseMap<SourceLocation, llvm::Value *> OpenMPDebugLocMapTy;
423   OpenMPDebugLocMapTy OpenMPDebugLocMap;
424   /// The type for a microtask which gets passed to __kmpc_fork_call().
425   /// Original representation is:
426   /// typedef void (kmpc_micro)(kmp_int32 global_tid, kmp_int32 bound_tid,...);
427   llvm::FunctionType *Kmpc_MicroTy = nullptr;
428   /// Stores debug location and ThreadID for the function.
429   struct DebugLocThreadIdTy {
        /// Neither of the two pointers below has a default member initializer.
430     llvm::Value *DebugLoc;
431     llvm::Value *ThreadID;
432     /// Insert point for the service instructions.
433     llvm::AssertingVH<llvm::Instruction> ServiceInsertPt = nullptr;
434   };
435   /// Map of local debug location, ThreadId and functions.
436   typedef llvm::DenseMap<llvm::Function *, DebugLocThreadIdTy>
437       OpenMPLocThreadIDMapTy;
438   OpenMPLocThreadIDMapTy OpenMPLocThreadIDMap;
439   /// Map of UDRs and corresponding combiner/initializer.
440   typedef llvm::DenseMap<const OMPDeclareReductionDecl *,
441                          std::pair<llvm::Function *, llvm::Function *>>
442       UDRMapTy;
443   UDRMapTy UDRMap;
444   /// Map of functions and locally defined UDRs.
445   typedef llvm::DenseMap<llvm::Function *,
446                          SmallVector<const OMPDeclareReductionDecl *, 4>>
447       FunctionUDRMapTy;
448   FunctionUDRMapTy FunctionUDRMap;
449   /// Map from the user-defined mapper declaration to its corresponding
450   /// function.
451   llvm::DenseMap<const OMPDeclareMapperDecl *, llvm::Function *> UDMMap;
452   /// Map of functions and their local user-defined mappers.
453   using FunctionUDMMapTy =
454       llvm::DenseMap<llvm::Function *,
455                      SmallVector<const OMPDeclareMapperDecl *, 4>>;
456   FunctionUDMMapTy FunctionUDMMap;
457   /// Maps local variables marked as lastprivate conditional to their internal
458   /// types.
459   llvm::DenseMap<llvm::Function *,
460                  llvm::DenseMap<CanonicalDeclPtr<const Decl>,
461                                 std::tuple<QualType, const FieldDecl *,
462                                            const FieldDecl *, LValue>>>
463       LastprivateConditionalToTypes;
464   /// Maps function to the position of the untied task locals stack.
465   llvm::DenseMap<llvm::Function *, unsigned> FunctionToUntiedTaskStackMap;
466   /// Type kmp_critical_name, originally defined as typedef kmp_int32
467   /// kmp_critical_name[8];
468   llvm::ArrayType *KmpCriticalNameTy;
469   /// An ordered map of auto-generated variables to their unique names.
470   /// It stores variables with the following names: 1) ".gomp_critical_user_" +
471   /// <critical_section_name> + ".var" for "omp critical" directives; 2)
472   /// <mangled_name_for_global_var> + ".cache." for cache for threadprivate
473   /// variables.
474   llvm::StringMap<llvm::AssertingVH<llvm::Constant>, llvm::BumpPtrAllocator>
475       InternalVars;
476   /// Type typedef kmp_int32 (* kmp_routine_entry_t)(kmp_int32, void *);
477   llvm::Type *KmpRoutineEntryPtrTy = nullptr;
478   QualType KmpRoutineEntryPtrQTy;
479   /// Type typedef struct kmp_task {
480   ///    void *              shareds; /**< pointer to block of pointers to
481   ///    shared vars   */
482   ///    kmp_routine_entry_t routine; /**< pointer to routine to call for
483   ///    executing task */
484   ///    kmp_int32           part_id; /**< part id for the task */
485   ///    kmp_routine_entry_t destructors; /* pointer to function to invoke
486   ///    destructors of firstprivate C++ objects */
487   /// } kmp_task_t;
488   QualType KmpTaskTQTy;
489   /// Saved kmp_task_t for task directive.
490   QualType SavedKmpTaskTQTy;
491   /// Saved kmp_task_t for taskloop-based directive.
492   QualType SavedKmpTaskloopTQTy;
493   /// Type typedef struct kmp_depend_info {
494   ///    kmp_intptr_t               base_addr;
495   ///    size_t                     len;
496   ///    struct {
497   ///             bool                   in:1;
498   ///             bool                   out:1;
499   ///    } flags;
500   /// } kmp_depend_info_t;
501   QualType KmpDependInfoTy;
502   /// Type typedef struct kmp_task_affinity_info {
503   ///    kmp_intptr_t base_addr;
504   ///    size_t len;
505   ///    struct {
506   ///      bool flag1 : 1;
507   ///      bool flag2 : 1;
508   ///      kmp_int32 reserved : 30;
509   ///   } flags;
510   /// } kmp_task_affinity_info_t;
511   QualType KmpTaskAffinityInfoTy;
512   /// struct kmp_dim {  // loop bounds info casted to kmp_int64
513   ///  kmp_int64 lo; // lower
514   ///  kmp_int64 up; // upper
515   ///  kmp_int64 st; // stride
516   /// };
517   QualType KmpDimTy;
518   /// Type struct __tgt_offload_entry{
519   ///   void      *addr;       // Pointer to the offload entry info.
520   ///                          // (function or global)
521   ///   char      *name;       // Name of the function or global.
522   ///   size_t     size;       // Size of the entry info (0 if it is a function).
523   ///   int32_t flags;
524   ///   int32_t reserved;
525   /// };
526   QualType TgtOffloadEntryQTy;
527   /// Entity that registers the offloading constants that were emitted so
528   /// far.
529   class OffloadEntriesInfoManagerTy {
530     CodeGenModule &CGM;
531 
532     /// Number of entries registered so far.
533     unsigned OffloadingEntriesNum = 0;
534 
535   public:
536     /// Base class of the entries info.
537     class OffloadEntryInfo {
538     public:
539       /// Kind of a given entry.
540       enum OffloadingEntryInfoKinds : unsigned {
541         /// Entry is a target region.
542         OffloadingEntryInfoTargetRegion = 0,
543         /// Entry is a declare target variable.
544         OffloadingEntryInfoDeviceGlobalVar = 1,
545         /// Invalid entry info.
546         OffloadingEntryInfoInvalid = ~0u
547       };
548 
549     protected:
550       OffloadEntryInfo() = delete;
          /// Sets only the kind. Order keeps its ~0u default, so isValid()
          /// reports false for an entry built this way.
551       explicit OffloadEntryInfo(OffloadingEntryInfoKinds Kind) : Kind(Kind) {}
          /// Sets kind, order and flags; the address is left unset.
552       explicit OffloadEntryInfo(OffloadingEntryInfoKinds Kind, unsigned Order,
553                                 uint32_t Flags)
554           : Flags(Flags), Order(Order), Kind(Kind) {}
          /// Protected and non-virtual: code outside the hierarchy cannot
          /// destroy an entry through this base type.
555       ~OffloadEntryInfo() = default;
556 
557     public:
          /// True once the entry carries an order other than the ~0u sentinel.
558       bool isValid() const { return Order != ~0u; }
559       unsigned getOrder() const { return Order; }
560       OffloadingEntryInfoKinds getKind() const { return Kind; }
561       uint32_t getFlags() const { return Flags; }
562       void setFlags(uint32_t NewFlags) { Flags = NewFlags; }
          /// Returns the tracked address as a constant, or null if none is
          /// tracked.
563       llvm::Constant *getAddress() const {
564         return cast_or_null<llvm::Constant>(Addr);
565       }
          /// Starts tracking \p V. Asserts that no live value is tracked yet.
566       void setAddress(llvm::Constant *V) {
567         assert(!Addr.pointsToAliveValue() && "Address has been set before!");
568         Addr = V;
569       }
          /// Always true: any pointer to this base type qualifies.
570       static bool classof(const OffloadEntryInfo *Info) { return true; }
571 
572     private:
573       /// Address of the entity that has to be mapped for offloading.
574       llvm::WeakTrackingVH Addr;
575 
576       /// Flags associated with the entry.
577       uint32_t Flags = 0u;
578 
579       /// Order this entry was emitted.
580       unsigned Order = ~0u;
581 
          /// Kind of the entry; every non-deleted constructor overwrites this
          /// default.
582       OffloadingEntryInfoKinds Kind = OffloadingEntryInfoInvalid;
583     };
584 
585     /// Return true if there are no entries defined.
586     bool empty() const;
587     /// Return number of entries defined so far.
588     unsigned size() const { return OffloadingEntriesNum; }
        /// Binds the manager to \p CGM; the entry counter starts at zero.
589     OffloadEntriesInfoManagerTy(CodeGenModule &CGM) : CGM(CGM) {}
590 
591     //
592     // Target region entries related.
593     //
594 
595     /// Kind of the target registry entry.
        /// Values of this type are taken as the flags of an
        /// OffloadEntryInfoTargetRegion.
596     enum OMPTargetRegionEntryKind : uint32_t {
597       /// Mark the entry as target region.
598       OMPTargetRegionEntryTargetRegion = 0x0,
599       /// Mark the entry as a global constructor.
600       OMPTargetRegionEntryCtor = 0x02,
601       /// Mark the entry as a global destructor.
602       OMPTargetRegionEntryDtor = 0x04,
603     };
604 
605     /// Target region entries info.
606     class OffloadEntryInfoTargetRegion final : public OffloadEntryInfo {
607       /// Address that can be used as the ID of the entry.
608       llvm::Constant *ID = nullptr;
609 
610     public:
          /// Creates a target-region entry with no order, address or ID; it
          /// reports isValid() == false.
611       OffloadEntryInfoTargetRegion()
612           : OffloadEntryInfo(OffloadingEntryInfoTargetRegion) {}
          /// Creates a target-region entry with the given order, address, ID and
          /// flags.
613       explicit OffloadEntryInfoTargetRegion(unsigned Order,
614                                             llvm::Constant *Addr,
615                                             llvm::Constant *ID,
616                                             OMPTargetRegionEntryKind Flags)
617           : OffloadEntryInfo(OffloadingEntryInfoTargetRegion, Order, Flags),
618             ID(ID) {
619         setAddress(Addr);
620       }
621 
622       llvm::Constant *getID() const { return ID; }
          /// Sets the ID. Asserts that no ID has been stored before.
623       void setID(llvm::Constant *V) {
624         assert(!ID && "ID has been set before!");
625         ID = V;
626       }
          /// True when \p Info has the target-region kind.
627       static bool classof(const OffloadEntryInfo *Info) {
628         return Info->getKind() == OffloadingEntryInfoTargetRegion;
629       }
630     };
631 
632     /// Initialize target region entry.
633     void initializeTargetRegionEntryInfo(unsigned DeviceID, unsigned FileID,
634                                          StringRef ParentName, unsigned LineNum,
635                                          unsigned Order);
636     /// Register target region entry.
637     void registerTargetRegionEntryInfo(unsigned DeviceID, unsigned FileID,
638                                        StringRef ParentName, unsigned LineNum,
639                                        llvm::Constant *Addr, llvm::Constant *ID,
640                                        OMPTargetRegionEntryKind Flags);
641     /// Return true if a target region entry with the provided information
642     /// exists.
643     bool hasTargetRegionEntryInfo(unsigned DeviceID, unsigned FileID,
644                                   StringRef ParentName, unsigned LineNum,
645                                   bool IgnoreAddressId = false) const;
646     /// Applies action \a Action on all registered entries.
647     typedef llvm::function_ref<void(unsigned, unsigned, StringRef, unsigned,
648                                     const OffloadEntryInfoTargetRegion &)>
649         OffloadTargetRegionEntryInfoActTy;
650     void actOnTargetRegionEntriesInfo(
651         const OffloadTargetRegionEntryInfoActTy &Action);
652 
653     //
654     // Device global variable entries related.
655     //
656 
657     /// Kind of the global variable entry.
        /// Values of this type are taken as the flags of an
        /// OffloadEntryInfoDeviceGlobalVar.
658     enum OMPTargetGlobalVarEntryKind : uint32_t {
659       /// Mark the entry as a declare target 'to' entry.
660       OMPTargetGlobalVarEntryTo = 0x0,
661       /// Mark the entry as a declare target 'link' entry.
662       OMPTargetGlobalVarEntryLink = 0x1,
663     };
664 
665     /// Device global variable entries info.
666     class OffloadEntryInfoDeviceGlobalVar final : public OffloadEntryInfo {
667       /// Size of the global variable.
668      CharUnits VarSize;
         /// Linkage of the global variable.
         /// NOTE(review): the first two constructors below give this member no
         /// value; if LinkageTypes is a plain enum, getLinkage() is
         /// indeterminate until setLinkage() runs -- confirm and consider a
         /// default initializer.
669      llvm::GlobalValue::LinkageTypes Linkage;
670 
671    public:
         /// Creates a device-global entry with no order; it reports
         /// isValid() == false.
672      OffloadEntryInfoDeviceGlobalVar()
673          : OffloadEntryInfo(OffloadingEntryInfoDeviceGlobalVar) {}
         /// Creates an entry that has an order and flags but no address yet.
674      explicit OffloadEntryInfoDeviceGlobalVar(unsigned Order,
675                                               OMPTargetGlobalVarEntryKind Flags)
676          : OffloadEntryInfo(OffloadingEntryInfoDeviceGlobalVar, Order, Flags) {}
         /// Creates a fully populated entry: order, address, size, flags and
         /// linkage.
677      explicit OffloadEntryInfoDeviceGlobalVar(
678          unsigned Order, llvm::Constant *Addr, CharUnits VarSize,
679          OMPTargetGlobalVarEntryKind Flags,
680          llvm::GlobalValue::LinkageTypes Linkage)
681          : OffloadEntryInfo(OffloadingEntryInfoDeviceGlobalVar, Order, Flags),
682            VarSize(VarSize), Linkage(Linkage) {
683        setAddress(Addr);
684       }
685 
686       CharUnits getVarSize() const { return VarSize; }
687       void setVarSize(CharUnits Size) { VarSize = Size; }
688       llvm::GlobalValue::LinkageTypes getLinkage() const { return Linkage; }
689       void setLinkage(llvm::GlobalValue::LinkageTypes LT) { Linkage = LT; }
          /// True when \p Info has the device-global-variable kind.
690       static bool classof(const OffloadEntryInfo *Info) {
691         return Info->getKind() == OffloadingEntryInfoDeviceGlobalVar;
692       }
693     };
694 
695     /// Initialize device global variable entry.
696     void initializeDeviceGlobalVarEntryInfo(StringRef Name,
697                                             OMPTargetGlobalVarEntryKind Flags,
698                                             unsigned Order);
699 
700     /// Register device global variable entry.
        /// \param VarName Name of the variable (NOTE(review): presumably the
        /// mangled name used as the storage key -- confirm).
        /// \param Addr Address of the variable.
        /// \param VarSize Size of the variable.
        /// \param Flags Kind of the entry ('to' or 'link').
        /// \param Linkage Linkage of the variable.
701     void
702     registerDeviceGlobalVarEntryInfo(StringRef VarName, llvm::Constant *Addr,
703                                      CharUnits VarSize,
704                                      OMPTargetGlobalVarEntryKind Flags,
705                                      llvm::GlobalValue::LinkageTypes Linkage);
706     /// Returns true if an entry is already stored under the name \p VarName.
707     bool hasDeviceGlobalVarEntryInfo(StringRef VarName) const {
708       return OffloadEntriesDeviceGlobalVar.find(VarName) !=
                 OffloadEntriesDeviceGlobalVar.end();
709     }
710     /// Callback type invoked with the name and the info of one entry.
711     using OffloadDeviceGlobalVarEntryInfoActTy =
712         llvm::function_ref<void(StringRef,
713                                 const OffloadEntryInfoDeviceGlobalVar &)>;
        /// Applies action \a Action on all registered entries.
714     void actOnDeviceGlobalVarEntriesInfo(
715         const OffloadDeviceGlobalVarEntryInfoActTy &Action);
716 
717   private:
718     // Storage for target region entries kind. The maps nest, outermost first,
719     // by device ID, file ID, parent function name and line number.
720     using OffloadEntriesTargetRegionPerLine =
721         llvm::DenseMap<unsigned, OffloadEntryInfoTargetRegion>;
722     using OffloadEntriesTargetRegionPerParentName =
723         llvm::StringMap<OffloadEntriesTargetRegionPerLine>;
724     using OffloadEntriesTargetRegionPerFile =
725         llvm::DenseMap<unsigned, OffloadEntriesTargetRegionPerParentName>;
726     using OffloadEntriesTargetRegionPerDevice =
727         llvm::DenseMap<unsigned, OffloadEntriesTargetRegionPerFile>;
728     using OffloadEntriesTargetRegionTy = OffloadEntriesTargetRegionPerDevice;
729     OffloadEntriesTargetRegionTy OffloadEntriesTargetRegion;
730     /// Device global variable entries, kept in a string map that is to be
731     /// indexed by the mangled name of the variable.
732     using OffloadEntriesDeviceGlobalVarTy =
733         llvm::StringMap<OffloadEntryInfoDeviceGlobalVar>;
734     OffloadEntriesDeviceGlobalVarTy OffloadEntriesDeviceGlobalVar;
735   };
      /// Manager holding the offload entries (target regions and device global
      /// variables) tracked by this runtime object.
736   OffloadEntriesInfoManagerTy OffloadEntriesInfoManager;
737 
      /// NOTE(review): undocumented flag, true by default; its exact meaning is
      /// not visible in this header -- confirm against its uses.
738   bool ShouldMarkAsGlobal = true;
739   /// List of the emitted declarations.
740   llvm::DenseSet<CanonicalDeclPtr<const Decl>> AlreadyEmittedTargetDecls;
741   /// List of the global variables with their addresses that should not be
742   /// emitted for the target.
743   llvm::StringMap<llvm::WeakTrackingVH> EmittedNonTargetVariables;
744 
745   /// List of variables that can become declare target implicitly and, thus,
746   /// must be emitted.
747   llvm::SmallDenseSet<const VarDecl *> DeferredGlobalVariables;
748 
      /// Set of canonical declarations; element type of NontemporalDeclsStack.
749   using NontemporalDeclsSet = llvm::SmallDenseSet<CanonicalDeclPtr<const Decl>>;
750   /// Stack for list of declarations in current context marked as nontemporal.
751   /// The set is the union of all current stack elements.
752   llvm::SmallVector<NontemporalDeclsSet, 4> NontemporalDeclsStack;
753 
      /// Ordered map from a canonical variable declaration to a pair of
      /// addresses. NOTE(review): presumably used for local variables of untied
      /// tasks; the role of each address is not visible here -- confirm.
754   using UntiedLocalVarsAddressesMap =
755       llvm::MapVector<CanonicalDeclPtr<const VarDecl>,
756                       std::pair<Address, Address>>;
      /// Stack of UntiedLocalVarsAddressesMap instances.
757   llvm::SmallVector<UntiedLocalVarsAddressesMap, 4> UntiedLocalVarsStack;
758 
759   /// Stack for list of addresses of declarations in current context marked as
760   /// lastprivate conditional. The set is the union of all current stack
761   /// elements.
762   llvm::SmallVector<LastprivateConditionalData, 4> LastprivateConditionalStack;
763 
764   /// Flag for keeping track of whether a requires unified_shared_memory
765   /// directive is present.
766   bool HasRequiresUnifiedSharedMemory = false;
767 
768   /// Atomic ordering from the omp requires directive.
769   llvm::AtomicOrdering RequiresAtomicOrdering = llvm::AtomicOrdering::Monotonic;
770 
771   /// Flag for keeping track of whether a target region has been emitted.
772   bool HasEmittedTargetRegion = false;
773 
774   /// Flag for keeping track of whether a device routine has been emitted.
775   /// NOTE(review): the sentence that followed here ("Device routines are
      /// specific to the") was left unfinished -- complete it once confirmed.
776   bool HasEmittedDeclareTargetRegion = false;
777 
778   /// Loads all the offload entries information from the host IR
779   /// metadata.
780   void loadOffloadInfoMetadata();
781 
782   /// Returns the __tgt_offload_entry type as a QualType.
783   QualType getTgtOffloadEntryQTy();
784 
785   /// Start scanning from statement \a S and emit all target regions
786   /// found along the way.
787   /// \param S Starting statement.
788   /// \param ParentName Name of the function declaration that is being scanned.
789   void scanForTargetRegionsFunctions(const Stmt *S, StringRef ParentName);
790 
791   /// Build type kmp_routine_entry_t (if not built yet).
      /// \param KmpInt32Ty NOTE(review): presumably the kmp_int32 type used when
      /// building kmp_routine_entry_t -- confirm against the definition.
792   void emitKmpRoutineEntryT(QualType KmpInt32Ty);
793 
794   /// Returns pointer to kmpc_micro type.
795   llvm::Type *getKmpc_MicroPointerTy();
796 
797   /// Returns __kmpc_for_static_init_* runtime function for the specified
798   /// size \a IVSize and sign \a IVSigned. Will create a distribute call
799   /// __kmpc_distribute_static_init* if \a IsGPUDistribute is set.
      /// \param IVSize Size of the iteration variable in bits.
      /// \param IVSigned Sign of the iteration variable.
      /// \param IsGPUDistribute true to request the __kmpc_distribute_static_init*
      /// variant instead.
800   llvm::FunctionCallee createForStaticInitFunction(unsigned IVSize,
801                                                    bool IVSigned,
802                                                    bool IsGPUDistribute);
803 
804   /// Returns __kmpc_dispatch_init_* runtime function for the specified
805   /// size \a IVSize and sign \a IVSigned.
      /// \param IVSize Size of the iteration variable in bits.
      /// \param IVSigned Sign of the iteration variable.
806   llvm::FunctionCallee createDispatchInitFunction(unsigned IVSize,
807                                                   bool IVSigned);
808 
809   /// Returns __kmpc_dispatch_next_* runtime function for the specified
810   /// size \a IVSize and sign \a IVSigned.
      /// \param IVSize Size of the iteration variable in bits.
      /// \param IVSigned Sign of the iteration variable.
811   llvm::FunctionCallee createDispatchNextFunction(unsigned IVSize,
812                                                   bool IVSigned);
813 
814   /// Returns __kmpc_dispatch_fini_* runtime function for the specified
815   /// size \a IVSize and sign \a IVSigned.
      /// \param IVSize Size of the iteration variable in bits.
      /// \param IVSigned Sign of the iteration variable.
816   llvm::FunctionCallee createDispatchFiniFunction(unsigned IVSize,
817                                                   bool IVSigned);
818 
819   /// If the cache object for the threadprivate variable \a VD is not in the
820   /// module yet, create it; then return it. This object is a pointer's worth
821   /// of storage that's reserved for use by the OpenMP runtime.
822   /// \param VD Threadprivate variable.
823   /// \return Cache variable for the specified threadprivate.
824   llvm::Constant *getOrCreateThreadPrivateCache(const VarDecl *VD);
825 
826   /// Gets (if a variable with the given name already exists) or creates an
827   /// internal global variable with the specified Name. The created variable has
828   /// linkage CommonLinkage by default and is initialized by null value.
829   /// \param Ty Type of the global variable. If it exists already, the type
830   /// must be the same.
831   /// \param Name Name of the variable.
      /// \param AddressSpace Address space for the variable; defaults to 0.
832   llvm::Constant *getOrCreateInternalVariable(llvm::Type *Ty,
833                                               const llvm::Twine &Name,
834                                               unsigned AddressSpace = 0);
835 
836   /// Set of threadprivate variables with the generated initializer, stored
      /// as strings (NOTE(review): presumably the variables' names -- confirm).
837   llvm::StringSet<> ThreadPrivateWithDefinition;
838 
839   /// Set of declare target variables with the generated initializer, stored
      /// as strings (NOTE(review): presumably the variables' names -- confirm).
840   llvm::StringSet<> DeclareTargetWithDefinition;
841 
842   /// Emits initialization code for the threadprivate variables.
      /// \param CGF Reference to current CodeGenFunction.
843   /// \param VDAddr Address of the global variable \a VD.
844   /// \param Ctor Pointer to a global init function for \a VD.
845   /// \param CopyCtor Pointer to a global copy function for \a VD.
846   /// \param Dtor Pointer to a global destructor function for \a VD.
847   /// \param Loc Location of threadprivate declaration.
848   void emitThreadPrivateVarInit(CodeGenFunction &CGF, Address VDAddr,
849                                 llvm::Value *Ctor, llvm::Value *CopyCtor,
850                                 llvm::Value *Dtor, SourceLocation Loc);
851 
852   /// Emit the array initialization or deletion portion for user-defined mapper
853   /// code generation.
      /// \param MapperCGF CodeGenFunction used to emit the mapper code.
      /// \param IsInit NOTE(review): presumably true selects the initialization
      /// portion and false the deletion portion -- confirm.
      /// NOTE(review): the remaining parameters (Handle, BasePtr, Ptr, Size,
      /// MapType, MapName, ElementSize, ExitBB) are not described in this header;
      /// see the definition for their roles.
854   void emitUDMapperArrayInitOrDel(CodeGenFunction &MapperCGF,
855                                   llvm::Value *Handle, llvm::Value *BasePtr,
856                                   llvm::Value *Ptr, llvm::Value *Size,
857                                   llvm::Value *MapType, llvm::Value *MapName,
858                                   CharUnits ElementSize,
859                                   llvm::BasicBlock *ExitBB, bool IsInit);
860 
      /// Aggregate returned by emitTaskInit(). All pointer members default to
      /// nullptr. NOTE(review): the individual fields are not documented in this
      /// header; their names suggest the new task value, its entry function, the
      /// task descriptor base and record, and a task duplication function --
      /// confirm against emitTaskInit's definition.
861   struct TaskResultTy {
862     llvm::Value *NewTask = nullptr;
863     llvm::Function *TaskEntry = nullptr;
864     llvm::Value *NewTaskNewTaskTTy = nullptr;
865     LValue TDBase;
866     const RecordDecl *KmpTaskTQTyRD = nullptr;
867     llvm::Value *TaskDupFn = nullptr;
868   };
869   /// Emit task region for the task directive. The task region is emitted in
870   /// several steps:
871   /// 1. Emit a call to kmp_task_t *__kmpc_omp_task_alloc(ident_t *, kmp_int32
872   /// gtid, kmp_int32 flags, size_t sizeof_kmp_task_t, size_t sizeof_shareds,
873   /// kmp_routine_entry_t *task_entry). Here task_entry is a pointer to the
874   /// function:
875   /// kmp_int32 .omp_task_entry.(kmp_int32 gtid, kmp_task_t *tt) {
876   ///   TaskFunction(gtid, tt->part_id, tt->shareds);
877   ///   return 0;
878   /// }
879   /// 2. Copy a list of shared variables to field shareds of the resulting
880   /// structure kmp_task_t returned by the previous call (if any).
881   /// 3. Copy a pointer to destructions function to field destructions of the
882   /// resulting structure kmp_task_t.
      /// \param CGF Reference to current CodeGenFunction.
      /// \param Loc Clang source location.
883   /// \param D Current task directive.
884   /// \param TaskFunction An LLVM function with type void (*)(i32 /*gtid*/, i32
885   /// /*part_id*/, captured_struct */*__context*/);
886   /// \param SharedsTy A type which contains references to the shared variables.
887   /// \param Shareds Context with the list of shared variables from the \p
888   /// TaskFunction.
889   /// \param Data Additional data for task generation like tiedness, final
890   /// state, list of privates etc.
      /// \return A TaskResultTy describing the emitted task.
891   TaskResultTy emitTaskInit(CodeGenFunction &CGF, SourceLocation Loc,
892                             const OMPExecutableDirective &D,
893                             llvm::Function *TaskFunction, QualType SharedsTy,
894                             Address Shareds, const OMPTaskDataTy &Data);
895 
896   /// Emit code that pushes the trip count of loops associated with constructs
897   /// 'target teams distribute' and 'teams distribute parallel for'.
      /// \param CGF Reference to current CodeGenFunction.
      /// \param D Directive whose associated loop trip count is pushed.
      /// \param DeviceID NOTE(review): presumably the ID of the target device the
      /// trip count is pushed for -- confirm.
898   /// \param SizeEmitter Emits the int64 value for the number of iterations of
899   /// the associated loop.
900   void emitTargetNumIterationsCall(
901       CodeGenFunction &CGF, const OMPExecutableDirective &D,
902       llvm::Value *DeviceID,
903       llvm::function_ref<llvm::Value *(CodeGenFunction &CGF,
904                                        const OMPLoopDirective &D)>
905           SizeEmitter);
906 
907   /// Emit update for lastprivate conditional data.
      /// \param CGF Reference to current CodeGenFunction.
      /// \param Loc Clang source location.
      /// NOTE(review): IVLVal, UniqueDeclName and LVal are not described in this
      /// header; presumably the iteration variable, the unique name of the
      /// declaration and the value being updated -- confirm.
908   void emitLastprivateConditionalUpdate(CodeGenFunction &CGF, LValue IVLVal,
909                                         StringRef UniqueDeclName, LValue LVal,
910                                         SourceLocation Loc);
911 
912   /// Returns the number of the elements and the address of the depobj
913   /// dependency array.
      /// \param CGF Reference to current CodeGenFunction.
      /// \param DepobjLVal LValue of the depobj object to inspect.
      /// \param Loc Clang source location.
914   /// \return Number of elements in depobj array and the pointer to the array of
915   /// dependencies.
916   std::pair<llvm::Value *, LValue> getDepobjElements(CodeGenFunction &CGF,
917                                                      LValue DepobjLVal,
918                                                      SourceLocation Loc);
919 
920 public:
      /// Constructs the runtime for module \p CGM by delegating to the
      /// three-argument constructor with "." for both string arguments
      /// (NOTE(review): presumably the name separators -- confirm).
921   explicit CGOpenMPRuntime(CodeGenModule &CGM)
922       : CGOpenMPRuntime(CGM, ".", ".") {}
      /// Virtual destructor; the class is meant to be derived from.
923   virtual ~CGOpenMPRuntime() {}
      /// NOTE(review): presumably releases or resets state held by the runtime;
      /// not described in this header -- confirm against the definition.
924   virtual void clear();
925 
926   /// Emits code for OpenMP 'if' clause using the specified \a ThenGen and
927   /// \a ElseGen generators. Here is the logic:
928   /// if (Cond) {
929   ///   ThenGen();
930   /// } else {
931   ///   ElseGen();
932   /// }
      /// \param CGF Reference to current CodeGenFunction.
      /// \param Cond Condition of the 'if' clause.
      /// \param ThenGen Generator for the code emitted when \a Cond holds.
      /// \param ElseGen Generator for the code emitted otherwise.
933   void emitIfClause(CodeGenFunction &CGF, const Expr *Cond,
934                     const RegionCodeGenTy &ThenGen,
935                     const RegionCodeGenTy &ElseGen);
936 
937   /// Checks if the \p Body is a \a CompoundStmt and returns its child
938   /// statement iff there is only one that is not evaluatable at compile
939   /// time.
940   static const Stmt *getSingleCompoundChild(ASTContext &Ctx, const Stmt *Body);
941 
942   /// Builds a name out of \p Parts and returns it as a string.
      /// NOTE(review): presumably the parts are combined using the
      /// platform-specific name separator -- confirm against the definition.
943   std::string getName(ArrayRef<StringRef> Parts) const;
944 
945   /// Emit code for the specified user defined reduction construct.
      /// \param CGF CodeGenFunction passed by pointer (NOTE(review): whether it
      /// may be null is not visible here -- confirm).
      /// \param D Declaration of the user-defined reduction.
946   virtual void emitUserDefinedReduction(CodeGenFunction *CGF,
947                                         const OMPDeclareReductionDecl *D);
948   /// Get combiner/initializer for the specified user-defined reduction, if any.
      /// \param D Declaration of the user-defined reduction.
      /// \return Pair of functions: the combiner first, then the initializer.
949   virtual std::pair<llvm::Function *, llvm::Function *>
950   getUserDefinedReduction(const OMPDeclareReductionDecl *D);
951 
952   /// Emit the function for the user defined mapper construct.
      /// \param D Declaration of the user-defined mapper.
      /// \param CGF Optional CodeGenFunction; defaults to nullptr.
953   void emitUserDefinedMapper(const OMPDeclareMapperDecl *D,
954                              CodeGenFunction *CGF = nullptr);
955   /// Get the function for the specified user-defined mapper. If it does not
956   /// exist, create one.
      /// \param D Declaration of the user-defined mapper.
957   llvm::Function *
958   getOrCreateUserDefinedMapperFunc(const OMPDeclareMapperDecl *D);
959 
960   /// Emits outlined function for the specified OpenMP parallel directive
961   /// \a D. This outlined function has type void(*)(kmp_int32 *ThreadID,
962   /// kmp_int32 BoundID, struct context_vars*).
963   /// \param D OpenMP directive.
964   /// \param ThreadIDVar Variable for thread id in the current OpenMP region.
965   /// \param InnermostKind Kind of innermost directive (for simple directives it
966   /// is a directive itself, for combined - its innermost directive).
967   /// \param CodeGen Code generation sequence for the \a D directive.
      /// \return The emitted outlined function.
968   virtual llvm::Function *emitParallelOutlinedFunction(
969       const OMPExecutableDirective &D, const VarDecl *ThreadIDVar,
970       OpenMPDirectiveKind InnermostKind, const RegionCodeGenTy &CodeGen);
971 
972   /// Emits outlined function for the specified OpenMP teams directive
973   /// \a D. This outlined function has type void(*)(kmp_int32 *ThreadID,
974   /// kmp_int32 BoundID, struct context_vars*).
975   /// \param D OpenMP directive.
976   /// \param ThreadIDVar Variable for thread id in the current OpenMP region.
977   /// \param InnermostKind Kind of innermost directive (for simple directives it
978   /// is a directive itself, for combined - its innermost directive).
979   /// \param CodeGen Code generation sequence for the \a D directive.
      /// \return The emitted outlined function.
980   virtual llvm::Function *emitTeamsOutlinedFunction(
981       const OMPExecutableDirective &D, const VarDecl *ThreadIDVar,
982       OpenMPDirectiveKind InnermostKind, const RegionCodeGenTy &CodeGen);
983 
984   /// Emits outlined function for the OpenMP task directive \a D. This
985   /// outlined function has type void(*)(kmp_int32 ThreadID, struct task_t*
986   /// TaskT).
987   /// \param D OpenMP directive.
988   /// \param ThreadIDVar Variable for thread id in the current OpenMP region.
989   /// \param PartIDVar Variable for partition id in the current OpenMP untied
990   /// task region.
991   /// \param TaskTVar Variable for task_t argument.
992   /// \param InnermostKind Kind of innermost directive (for simple directives it
993   /// is a directive itself, for combined - its innermost directive).
994   /// \param CodeGen Code generation sequence for the \a D directive.
995   /// \param Tied true if task is generated for tied task, false otherwise.
996   /// \param NumberOfParts Number of parts in untied task. Ignored for tied
997   /// tasks. Passed by non-const reference.
      /// \return The emitted outlined function.
998   ///
999   virtual llvm::Function *emitTaskOutlinedFunction(
1000       const OMPExecutableDirective &D, const VarDecl *ThreadIDVar,
1001       const VarDecl *PartIDVar, const VarDecl *TaskTVar,
1002       OpenMPDirectiveKind InnermostKind, const RegionCodeGenTy &CodeGen,
1003       bool Tied, unsigned &NumberOfParts);
1004 
1005   /// Cleans up references to the objects in finished function.
1006   /// \param CGF CodeGenFunction of the function that has been finished.
1007   virtual void functionFinished(CodeGenFunction &CGF);
1008 
1009   /// Emits code for parallel or serial call of the \a OutlinedFn with
1010   /// the captured variables passed in \a CapturedVars.
1011   /// \param CGF Reference to current CodeGenFunction.
       /// \param Loc Clang source location.
1012   /// \param OutlinedFn Outlined function to be run in parallel threads. Type of
1013   /// this function is void(*)(kmp_int32 *, kmp_int32, struct context_vars*).
1014   /// \param CapturedVars Values of the captured variables used in
1015   /// \a OutlinedFn function.
1016   /// \param IfCond Condition in the associated 'if' clause, if it was
1017   /// specified, nullptr otherwise.
1018   ///
1019   virtual void emitParallelCall(CodeGenFunction &CGF, SourceLocation Loc,
1020                                 llvm::Function *OutlinedFn,
1021                                 ArrayRef<llvm::Value *> CapturedVars,
1022                                 const Expr *IfCond);
1023 
1024   /// Emits a critical region.
       /// \param CGF Reference to current CodeGenFunction.
1025   /// \param CriticalName Name of the critical region.
1026   /// \param CriticalOpGen Generator for the statement associated with the given
1027   /// critical region.
       /// \param Loc Clang source location.
1028   /// \param Hint Value of the 'hint' clause (optional).
1029   virtual void emitCriticalRegion(CodeGenFunction &CGF, StringRef CriticalName,
1030                                   const RegionCodeGenTy &CriticalOpGen,
1031                                   SourceLocation Loc,
1032                                   const Expr *Hint = nullptr);
1033 
1034   /// Emits a master region.
       /// \param CGF Reference to current CodeGenFunction.
1035   /// \param MasterOpGen Generator for the statement associated with the given
1036   /// master region.
       /// \param Loc Clang source location.
1037   virtual void emitMasterRegion(CodeGenFunction &CGF,
1038                                 const RegionCodeGenTy &MasterOpGen,
1039                                 SourceLocation Loc);
1040 
1041   /// Emits a masked region.
       /// \param CGF Reference to current CodeGenFunction.
1042   /// \param MaskedOpGen Generator for the statement associated with the given
1043   /// masked region.
       /// \param Loc Clang source location.
       /// \param Filter Optional expression, nullptr by default (NOTE(review):
       /// presumably the expression of the 'filter' clause -- confirm).
1044   virtual void emitMaskedRegion(CodeGenFunction &CGF,
1045                                 const RegionCodeGenTy &MaskedOpGen,
1046                                 SourceLocation Loc,
1047                                 const Expr *Filter = nullptr);
1048 
1049   /// Emits code for a taskyield directive.
       /// \param CGF Reference to current CodeGenFunction.
       /// \param Loc Clang source location.
1050   virtual void emitTaskyieldCall(CodeGenFunction &CGF, SourceLocation Loc);
1051 
1052   /// Emit a taskgroup region.
       /// \param CGF Reference to current CodeGenFunction.
1053   /// \param TaskgroupOpGen Generator for the statement associated with the
1054   /// given taskgroup region.
       /// \param Loc Clang source location.
1055   virtual void emitTaskgroupRegion(CodeGenFunction &CGF,
1056                                    const RegionCodeGenTy &TaskgroupOpGen,
1057                                    SourceLocation Loc);
1058 
1059   /// Emits a single region.
       /// \param CGF Reference to current CodeGenFunction.
1060   /// \param SingleOpGen Generator for the statement associated with the given
1061   /// single region.
       /// \param Loc Clang source location.
       /// NOTE(review): CopyprivateVars, DestExprs, SrcExprs and AssignmentOps are
       /// not described in this header; presumably they describe the variables of
       /// a 'copyprivate' clause and how they are copied -- confirm.
1062   virtual void emitSingleRegion(CodeGenFunction &CGF,
1063                                 const RegionCodeGenTy &SingleOpGen,
1064                                 SourceLocation Loc,
1065                                 ArrayRef<const Expr *> CopyprivateVars,
1066                                 ArrayRef<const Expr *> DestExprs,
1067                                 ArrayRef<const Expr *> SrcExprs,
1068                                 ArrayRef<const Expr *> AssignmentOps);
1069 
1070   /// Emit an ordered region.
       /// \param CGF Reference to current CodeGenFunction.
1071   /// \param OrderedOpGen Generator for the statement associated with the given
1072   /// ordered region.
       /// \param Loc Clang source location.
       /// \param IsThreads NOTE(review): presumably true when the 'threads' form
       /// of the ordered construct is in effect -- confirm.
1073   virtual void emitOrderedRegion(CodeGenFunction &CGF,
1074                                  const RegionCodeGenTy &OrderedOpGen,
1075                                  SourceLocation Loc, bool IsThreads);
1076 
1077   /// Emit an implicit/explicit barrier for OpenMP threads.
       /// \param CGF Reference to current CodeGenFunction.
       /// \param Loc Clang source location.
1078   /// \param Kind Directive for which this implicit barrier call must be
1079   /// generated. Must be OMPD_barrier for explicit barrier generation.
1080   /// \param EmitChecks true if need to emit checks for cancellation barriers.
1081   /// \param ForceSimpleCall true if a simple barrier call must be emitted,
1082   /// false if the runtime class decides which one to emit (simple or with
1083   /// cancellation checks).
1084   ///
1085   virtual void emitBarrierCall(CodeGenFunction &CGF, SourceLocation Loc,
1086                                OpenMPDirectiveKind Kind,
1087                                bool EmitChecks = true,
1088                                bool ForceSimpleCall = false);
1089 
1090   /// Check if the specified \a ScheduleKind is static non-chunked.
1091   /// This kind of worksharing directive is emitted without outer loop.
1092   /// \param ScheduleKind Schedule kind specified in the 'schedule' clause.
1093   /// \param Chunked True if chunk is specified in the clause.
1094   /// \return true if the schedule is static non-chunked.
1095   virtual bool isStaticNonchunked(OpenMPScheduleClauseKind ScheduleKind,
1096                                   bool Chunked) const;
1097 
1098   /// Check if the specified \a ScheduleKind is static non-chunked.
1099   /// This kind of distribute directive is emitted without outer loop.
1100   /// \param ScheduleKind Schedule kind specified in the 'dist_schedule' clause.
1101   /// \param Chunked True if chunk is specified in the clause.
1102   /// \return true if the schedule is static non-chunked.
1103   virtual bool isStaticNonchunked(OpenMPDistScheduleClauseKind ScheduleKind,
1104                                   bool Chunked) const;
1105 
1106   /// Check if the specified \a ScheduleKind is static chunked.
1107   /// \param ScheduleKind Schedule kind specified in the 'schedule' clause.
1108   /// \param Chunked True if chunk is specified in the clause.
1109   /// \return true if the schedule is static chunked.
1110   virtual bool isStaticChunked(OpenMPScheduleClauseKind ScheduleKind,
1111                                bool Chunked) const;
1112 
1113   /// Check if the specified \a ScheduleKind is static chunked.
1114   /// \param ScheduleKind Schedule kind specified in the 'dist_schedule' clause.
1115   /// \param Chunked True if chunk is specified in the clause.
1116   /// \return true if the schedule is static chunked.
1117   virtual bool isStaticChunked(OpenMPDistScheduleClauseKind ScheduleKind,
1118                                bool Chunked) const;
1119 
1120   /// Check if the specified \a ScheduleKind is dynamic.
1121   /// This kind of worksharing directive is emitted without outer loop.
1122   /// \param ScheduleKind Schedule Kind specified in the 'schedule' clause.
1123   /// \return true if the schedule is dynamic.
1124   virtual bool isDynamic(OpenMPScheduleClauseKind ScheduleKind) const;
1125 
1126   /// Struct with the values to be passed to the dispatch runtime function.
1127   struct DispatchRTInput {
1128     /// Loop lower bound
1129     llvm::Value *LB = nullptr;
1130     /// Loop upper bound
1131     llvm::Value *UB = nullptr;
1132     /// Chunk size specified using 'schedule' clause (nullptr if chunk
1133     /// was not specified)
1134     llvm::Value *Chunk = nullptr;
         /// Leaves all three values set to nullptr.
1135     DispatchRTInput() = default;
         /// Stores the given lower bound, upper bound and chunk values.
1136     DispatchRTInput(llvm::Value *LB, llvm::Value *UB, llvm::Value *Chunk)
1137         : LB(LB), UB(UB), Chunk(Chunk) {}
1138   };
1139 
1140   /// Call the appropriate runtime routine to initialize it before start
1141   /// of loop.
1142   ///
1143   /// This is used for non static scheduled types and when the ordered
1144   /// clause is present on the loop construct.
1145   /// Depending on the loop schedule, it is necessary to call some runtime
1146   /// routine before start of the OpenMP loop to get the loop upper / lower
1147   /// bounds LB and UB and stride ST.
1148   ///
1149   /// \param CGF Reference to current CodeGenFunction.
1150   /// \param Loc Clang source location.
1151   /// \param ScheduleKind Schedule kind, specified by the 'schedule' clause.
1152   /// \param IVSize Size of the iteration variable in bits.
1153   /// \param IVSigned Sign of the iteration variable.
1154   /// \param Ordered true if loop is ordered, false otherwise.
1155   /// \param DispatchValues struct containing llvm values for lower bound, upper
1156   /// bound, and chunk expression.
1157   /// For the default (nullptr) value, the chunk 1 will be used.
1158   ///
1159   virtual void emitForDispatchInit(CodeGenFunction &CGF, SourceLocation Loc,
1160                                    const OpenMPScheduleTy &ScheduleKind,
1161                                    unsigned IVSize, bool IVSigned, bool Ordered,
1162                                    const DispatchRTInput &DispatchValues);
1163 
1164   /// Struct with the values to be passed to the static runtime function
1165   struct StaticRTInput {
1166     /// Size of the iteration variable in bits.
1167     unsigned IVSize = 0;
1168     /// Sign of the iteration variable.
1169     bool IVSigned = false;
1170     /// true if loop is ordered, false otherwise.
1171     bool Ordered = false;
1172     /// Address of the output variable in which the flag of the last iteration
1173     /// is returned.
1174     Address IL = Address::invalid();
1175     /// Address of the output variable in which the lower iteration number is
1176     /// returned.
1177     Address LB = Address::invalid();
1178     /// Address of the output variable in which the upper iteration number is
1179     /// returned.
1180     Address UB = Address::invalid();
1181     /// Address of the output variable in which the stride value is returned
1182     /// necessary to generate the static_chunked scheduled loop.
1183     Address ST = Address::invalid();
1184     /// Value of the chunk for the static_chunked scheduled loop. For the
1185     /// default (nullptr) value, the chunk 1 will be used.
1186     llvm::Value *Chunk = nullptr;
         /// Stores every field from the matching argument; only \p Chunk is
         /// optional and defaults to nullptr.
1187     StaticRTInput(unsigned IVSize, bool IVSigned, bool Ordered, Address IL,
1188                   Address LB, Address UB, Address ST,
1189                   llvm::Value *Chunk = nullptr)
1190         : IVSize(IVSize), IVSigned(IVSigned), Ordered(Ordered), IL(IL), LB(LB),
1191           UB(UB), ST(ST), Chunk(Chunk) {}
1192   };
1193   /// Call the appropriate runtime routine to initialize it before start
1194   /// of loop.
1195   ///
1196   /// This is used only in case of static schedule, when the user did not
1197   /// specify an ordered clause on the loop construct.
1198   /// Depending on the loop schedule, it is necessary to call some runtime
1199   /// routine before start of the OpenMP loop to get the loop upper / lower
1200   /// bounds LB and UB and stride ST.
1201   ///
1202   /// \param CGF Reference to current CodeGenFunction.
1203   /// \param Loc Clang source location.
1204   /// \param DKind Kind of the directive.
1205   /// \param ScheduleKind Schedule kind, specified by the 'schedule' clause.
1206   /// \param Values Input arguments for the construct.
1207   ///
1208   virtual void emitForStaticInit(CodeGenFunction &CGF, SourceLocation Loc,
1209                                  OpenMPDirectiveKind DKind,
1210                                  const OpenMPScheduleTy &ScheduleKind,
1211                                  const StaticRTInput &Values);
1212 
1213   /// Static-initialization entry point taking a 'dist_schedule' kind.
       /// NOTE(review): this summary is inferred from the name and parameters
       /// (it mirrors emitForStaticInit) -- confirm against the definition.
       ///
1214   /// \param CGF Reference to current CodeGenFunction.
1215   /// \param Loc Clang source location.
1216   /// \param SchedKind Schedule kind, specified by the 'dist_schedule' clause.
1217   /// \param Values Input arguments for the construct.
1218   ///
1219   virtual void emitDistributeStaticInit(CodeGenFunction &CGF,
1220                                         SourceLocation Loc,
1221                                         OpenMPDistScheduleClauseKind SchedKind,
1222                                         const StaticRTInput &Values);
1223 
1224   /// Call the appropriate runtime routine to notify that we finished an
1225   /// iteration of the ordered loop with the dynamic scheduling.
1226   ///
1227   /// \param CGF Reference to current CodeGenFunction.
1228   /// \param Loc Clang source location.
1229   /// \param IVSize Size of the iteration variable in bits.
1230   /// \param IVSigned Sign of the iteration variable.
1231   ///
1232   virtual void emitForOrderedIterationEnd(CodeGenFunction &CGF,
1233                                           SourceLocation Loc, unsigned IVSize,
1234                                           bool IVSigned);
1235 
1236   /// Call the appropriate runtime routine to notify that we finished
1237   /// all the work with the current loop.
1238   ///
1239   /// \param CGF Reference to current CodeGenFunction.
1240   /// \param Loc Clang source location.
1241   /// \param DKind Kind of the directive for which the static finish is emitted.
1242   ///
1243   virtual void emitForStaticFinish(CodeGenFunction &CGF, SourceLocation Loc,
1244                                    OpenMPDirectiveKind DKind);
1245 
1246   /// Call __kmpc_dispatch_next(
1247   ///          ident_t *loc, kmp_int32 tid, kmp_int32 *p_lastiter,
1248   ///          kmp_int[32|64] *p_lower, kmp_int[32|64] *p_upper,
1249   ///          kmp_int[32|64] *p_stride);
       /// \param CGF Reference to current CodeGenFunction.
       /// \param Loc Clang source location.
1250   /// \param IVSize Size of the iteration variable in bits.
1251   /// \param IVSigned Sign of the iteration variable.
1252   /// \param IL Address of the output variable in which the flag of the
1253   /// last iteration is returned.
1254   /// \param LB Address of the output variable in which the lower iteration
1255   /// number is returned.
1256   /// \param UB Address of the output variable in which the upper iteration
1257   /// number is returned.
1258   /// \param ST Address of the output variable in which the stride value is
1259   /// returned.
       /// \return An llvm::Value (NOTE(review): presumably derived from the
       /// result of the runtime call -- confirm against the definition).
1260   virtual llvm::Value *emitForNext(CodeGenFunction &CGF, SourceLocation Loc,
1261                                    unsigned IVSize, bool IVSigned,
1262                                    Address IL, Address LB,
1263                                    Address UB, Address ST);
1264 
1265   /// Emits call to void __kmpc_push_num_threads(ident_t *loc, kmp_int32
1266   /// global_tid, kmp_int32 num_threads) to generate code for 'num_threads'
1267   /// clause.
       /// \param CGF Reference to current CodeGenFunction.
1268   /// \param NumThreads An integer value of threads.
       /// \param Loc Clang source location.
1269   virtual void emitNumThreadsClause(CodeGenFunction &CGF,
1270                                     llvm::Value *NumThreads,
1271                                     SourceLocation Loc);
1272 
1273   /// Emit call to void __kmpc_push_proc_bind(ident_t *loc, kmp_int32
1274   /// global_tid, int proc_bind) to generate code for 'proc_bind' clause.
       /// \param CGF Reference to current CodeGenFunction.
       /// \param ProcBind Kind given in the 'proc_bind' clause.
       /// \param Loc Clang source location.
1275   virtual void emitProcBindClause(CodeGenFunction &CGF,
1276                                   llvm::omp::ProcBindKind ProcBind,
1277                                   SourceLocation Loc);
1278 
1279   /// Returns address of the threadprivate variable for the current
1280   /// thread.
       /// \param CGF Reference to current CodeGenFunction.
1281   /// \param VD Threadprivate variable.
1282   /// \param VDAddr Address of the global variable \a VD.
1283   /// \param Loc Location of the reference to threadprivate var.
1284   /// \return Address of the threadprivate variable for the current thread.
1285   virtual Address getAddrOfThreadPrivate(CodeGenFunction &CGF,
1286                                          const VarDecl *VD,
1287                                          Address VDAddr,
1288                                          SourceLocation Loc);
1289 
1290   /// Returns the address of the variable marked as declare target with link
1291   /// clause OR as declare target with to clause and unified memory.
       /// \param VD Declare target variable.
1292   virtual Address getAddrOfDeclareTargetVar(const VarDecl *VD);
1293 
1294   /// Emit code for initialization of a threadprivate variable. It emits
1295   /// a call to runtime library which adds initial value to the newly created
1296   /// threadprivate variable (if it is not constant) and registers destructor
1297   /// for the variable (if any).
1298   /// \param VD Threadprivate variable.
1299   /// \param VDAddr Address of the global variable \a VD.
1300   /// \param Loc Location of threadprivate declaration.
1301   /// \param PerformInit true if initialization expression is not constant.
       /// \param CGF Optional CodeGenFunction; defaults to nullptr.
       /// \return A function pointer (NOTE(review): what it denotes and when it
       /// is null is not visible here -- confirm against the definition).
1302   virtual llvm::Function *
1303   emitThreadPrivateVarDefinition(const VarDecl *VD, Address VDAddr,
1304                                  SourceLocation Loc, bool PerformInit,
1305                                  CodeGenFunction *CGF = nullptr);
1306 
1307   /// Emit code for initialization of a declare target variable.
1308   /// \param VD Declare target variable.
1309   /// \param Addr Address of the global variable \a VD.
1310   /// \param PerformInit true if the initialization expression is not constant.
1311   virtual bool emitDeclareTargetVarDefinition(const VarDecl *VD,
1312                                               llvm::GlobalVariable *Addr,
1313                                               bool PerformInit);
1314 
1315   /// Creates an artificial threadprivate variable with name \p Name and type
1316   /// \p VarType.
1317   /// \param VarType Type of the artificial threadprivate variable.
1318   /// \param Name Name of the artificial threadprivate variable.
1319   virtual Address getAddrOfArtificialThreadPrivate(CodeGenFunction &CGF,
1320                                                    QualType VarType,
1321                                                    StringRef Name);
1322 
1323   /// Emit flush of the variables specified in the 'omp flush' directive.
1324   /// \param Vars List of variables to flush.
1325   virtual void emitFlush(CodeGenFunction &CGF, ArrayRef<const Expr *> Vars,
1326                          SourceLocation Loc, llvm::AtomicOrdering AO);
1327 
1328   /// Emit task region for the task directive. The task region is
1329   /// emitted in several steps:
1330   /// 1. Emit a call to kmp_task_t *__kmpc_omp_task_alloc(ident_t *, kmp_int32
1331   /// gtid, kmp_int32 flags, size_t sizeof_kmp_task_t, size_t sizeof_shareds,
1332   /// kmp_routine_entry_t *task_entry). Here task_entry is a pointer to the
1333   /// function:
1334   /// kmp_int32 .omp_task_entry.(kmp_int32 gtid, kmp_task_t *tt) {
1335   ///   TaskFunction(gtid, tt->part_id, tt->shareds);
1336   ///   return 0;
1337   /// }
1338   /// 2. Copy a list of shared variables to field shareds of the resulting
1339   /// structure kmp_task_t returned by the previous call (if any).
1340   /// 3. Copy a pointer to destructions function to field destructions of the
1341   /// resulting structure kmp_task_t.
1342   /// 4. Emit a call to kmp_int32 __kmpc_omp_task(ident_t *, kmp_int32 gtid,
1343   /// kmp_task_t *new_task), where new_task is the resulting structure from
1344   /// the previous items.
1345   /// \param D Current task directive.
1346   /// \param TaskFunction An LLVM function with type void (*)(i32 /*gtid*/, i32
1347   /// /*part_id*/, captured_struct */*__context*/);
1348   /// \param SharedsTy A type which contains references to the shared variables.
1349   /// \param Shareds Context with the list of shared variables from the \p
1350   /// TaskFunction.
1351   /// \param IfCond Not a nullptr if 'if' clause was specified, nullptr
1352   /// otherwise.
1353   /// \param Data Additional data for task generation like tiedness, final
1354   /// state, list of privates etc.
1355   virtual void emitTaskCall(CodeGenFunction &CGF, SourceLocation Loc,
1356                             const OMPExecutableDirective &D,
1357                             llvm::Function *TaskFunction, QualType SharedsTy,
1358                             Address Shareds, const Expr *IfCond,
1359                             const OMPTaskDataTy &Data);
1360 
1361   /// Emit task region for the taskloop directive. The taskloop region is
1362   /// emitted in several steps:
1363   /// 1. Emit a call to kmp_task_t *__kmpc_omp_task_alloc(ident_t *, kmp_int32
1364   /// gtid, kmp_int32 flags, size_t sizeof_kmp_task_t, size_t sizeof_shareds,
1365   /// kmp_routine_entry_t *task_entry). Here task_entry is a pointer to the
1366   /// function:
1367   /// kmp_int32 .omp_task_entry.(kmp_int32 gtid, kmp_task_t *tt) {
1368   ///   TaskFunction(gtid, tt->part_id, tt->shareds);
1369   ///   return 0;
1370   /// }
1371   /// 2. Copy a list of shared variables to field shareds of the resulting
1372   /// structure kmp_task_t returned by the previous call (if any).
1373   /// 3. Copy a pointer to destructions function to field destructions of the
1374   /// resulting structure kmp_task_t.
1375   /// 4. Emit a call to void __kmpc_taskloop(ident_t *loc, int gtid, kmp_task_t
1376   /// *task, int if_val, kmp_uint64 *lb, kmp_uint64 *ub, kmp_int64 st, int
1377   /// nogroup, int sched, kmp_uint64 grainsize, void *task_dup ), where task
1378   /// is the resulting structure from the
1379   /// previous items.
1380   /// \param D Current taskloop directive.
1381   /// \param TaskFunction An LLVM function with type void (*)(i32 /*gtid*/, i32
1382   /// /*part_id*/, captured_struct */*__context*/);
1383   /// \param SharedsTy A type which contains references to the shared variables.
1384   /// \param Shareds Context with the list of shared variables from the \p
1385   /// TaskFunction.
1386   /// \param IfCond Not a nullptr if 'if' clause was specified, nullptr
1387   /// otherwise.
1388   /// \param Data Additional data for task generation like tiedness, final
1389   /// state, list of privates etc.
1390   virtual void emitTaskLoopCall(CodeGenFunction &CGF, SourceLocation Loc,
1391                                 const OMPLoopDirective &D,
1392                                 llvm::Function *TaskFunction,
1393                                 QualType SharedsTy, Address Shareds,
1394                                 const Expr *IfCond, const OMPTaskDataTy &Data);
1395 
1396   /// Emit code for the directive that does not require outlining.
1397   ///
1398   /// \param InnermostKind Kind of innermost directive (for simple directives it
1399   /// is a directive itself, for combined - its innermost directive).
1400   /// \param CodeGen Code generation sequence for the directive.
1401   /// \param HasCancel true if the region has an inner cancel directive, false
1402   /// otherwise.
1403   virtual void emitInlinedDirective(CodeGenFunction &CGF,
1404                                     OpenMPDirectiveKind InnermostKind,
1405                                     const RegionCodeGenTy &CodeGen,
1406                                     bool HasCancel = false);
1407 
1408   /// Emits the reduction function.
1409   /// \param ArgsType Array type containing pointers to reduction variables.
1410   /// \param Privates List of private copies for original reduction arguments.
1411   /// \param LHSExprs List of LHS in \a ReductionOps reduction operations.
1412   /// \param RHSExprs List of RHS in \a ReductionOps reduction operations.
1413   /// \param ReductionOps List of reduction operations in form 'LHS binop RHS'
1414   /// or 'operator binop(LHS, RHS)'.
1415   llvm::Function *emitReductionFunction(SourceLocation Loc,
1416                                         llvm::Type *ArgsType,
1417                                         ArrayRef<const Expr *> Privates,
1418                                         ArrayRef<const Expr *> LHSExprs,
1419                                         ArrayRef<const Expr *> RHSExprs,
1420                                         ArrayRef<const Expr *> ReductionOps);
1421 
1422   /// Emits a single reduction combiner.
1423   void emitSingleReductionCombiner(CodeGenFunction &CGF,
1424                                    const Expr *ReductionOp,
1425                                    const Expr *PrivateRef,
1426                                    const DeclRefExpr *LHS,
1427                                    const DeclRefExpr *RHS);
1428 
1429   struct ReductionOptionsTy {
1430     bool WithNowait; ///< Parent directive also has a nowait clause.
1431     bool SimpleReduction; ///< Emit the reduction operation only.
1432     OpenMPDirectiveKind ReductionKind; ///< Kind of reduction to perform.
1433   };
1434   /// Emit code for the reduction clause. The following code should be emitted
1435   /// for the reduction:
1436   /// \code
1437   ///
1438   /// static kmp_critical_name lock = { 0 };
1439   ///
1440   /// void reduce_func(void *lhs[<n>], void *rhs[<n>]) {
1441   ///  ...
1442   ///  *(Type<i>*)lhs[i] = RedOp<i>(*(Type<i>*)lhs[i], *(Type<i>*)rhs[i]);
1443   ///  ...
1444   /// }
1445   ///
1446   /// ...
1447   /// void *RedList[<n>] = {&<RHSExprs>[0], ..., &<RHSExprs>[<n>-1]};
1448   /// switch (__kmpc_reduce{_nowait}(<loc>, <gtid>, <n>, sizeof(RedList),
1449   /// RedList, reduce_func, &<lock>)) {
1450   /// case 1:
1451   ///  ...
1452   ///  <LHSExprs>[i] = RedOp<i>(*<LHSExprs>[i], *<RHSExprs>[i]);
1453   ///  ...
1454   /// __kmpc_end_reduce{_nowait}(<loc>, <gtid>, &<lock>);
1455   /// break;
1456   /// case 2:
1457   ///  ...
1458   ///  Atomic(<LHSExprs>[i] = RedOp<i>(*<LHSExprs>[i], *<RHSExprs>[i]));
1459   ///  ...
1460   /// break;
1461   /// default:;
1462   /// }
1463   /// \endcode
1464   ///
1465   /// \param Privates List of private copies for original reduction arguments.
1466   /// \param LHSExprs List of LHS in \a ReductionOps reduction operations.
1467   /// \param RHSExprs List of RHS in \a ReductionOps reduction operations.
1468   /// \param ReductionOps List of reduction operations in form 'LHS binop RHS'
1469   /// or 'operator binop(LHS, RHS)'.
1470   /// \param Options List of options for reduction codegen:
1471   ///     WithNowait true if the parent directive also has a nowait clause,
1472   ///     false otherwise.
1473   ///     SimpleReduction Emit reduction operation only. Used for omp simd
1474   ///     directive on the host.
1475   ///     ReductionKind The kind of reduction to perform.
1476   virtual void emitReduction(CodeGenFunction &CGF, SourceLocation Loc,
1477                              ArrayRef<const Expr *> Privates,
1478                              ArrayRef<const Expr *> LHSExprs,
1479                              ArrayRef<const Expr *> RHSExprs,
1480                              ArrayRef<const Expr *> ReductionOps,
1481                              ReductionOptionsTy Options);
1482 
1483   /// Emit code for initialization of the task reduction clause. The following
1484   /// code should be emitted for the reduction:
1485   /// \code
1486   ///
1487   /// _taskred_item_t red_data[n];
1488   /// ...
1489   /// red_data[i].shar = &shareds[i];
1490   /// red_data[i].orig = &origs[i];
1491   /// red_data[i].size = sizeof(origs[i]);
1492   /// red_data[i].f_init = (void*)RedInit<i>;
1493   /// red_data[i].f_fini = (void*)RedDest<i>;
1494   /// red_data[i].f_comb = (void*)RedOp<i>;
1495   /// red_data[i].flags = <Flag_i>;
1496   /// ...
1497   /// void* tg1 = __kmpc_taskred_init(gtid, n, red_data);
1498   /// \endcode
1499   /// For a reduction clause with the task modifier it emits the next call:
1500   /// \code
1501   ///
1502   /// _taskred_item_t red_data[n];
1503   /// ...
1504   /// red_data[i].shar = &shareds[i];
1505   /// red_data[i].orig = &origs[i];
1506   /// red_data[i].size = sizeof(origs[i]);
1507   /// red_data[i].f_init = (void*)RedInit<i>;
1508   /// red_data[i].f_fini = (void*)RedDest<i>;
1509   /// red_data[i].f_comb = (void*)RedOp<i>;
1510   /// red_data[i].flags = <Flag_i>;
1511   /// ...
1512   /// void* tg1 = __kmpc_taskred_modifier_init(loc, gtid, is_worksharing, n,
1513   /// red_data);
1514   /// \endcode
1515   /// \param LHSExprs List of LHS in \a Data.ReductionOps reduction operations.
1516   /// \param RHSExprs List of RHS in \a Data.ReductionOps reduction operations.
1517   /// \param Data Additional data for task generation like tiedness, final
1518   /// state, list of privates, reductions etc.
1519   virtual llvm::Value *emitTaskReductionInit(CodeGenFunction &CGF,
1520                                              SourceLocation Loc,
1521                                              ArrayRef<const Expr *> LHSExprs,
1522                                              ArrayRef<const Expr *> RHSExprs,
1523                                              const OMPTaskDataTy &Data);
1524 
1525   /// Emits the following code for a reduction clause with the task modifier:
1526   /// \code
1527   /// __kmpc_task_reduction_modifier_fini(loc, gtid, is_worksharing);
1528   /// \endcode
1529   virtual void emitTaskReductionFini(CodeGenFunction &CGF, SourceLocation Loc,
1530                                      bool IsWorksharingReduction);
1531 
1532   /// Required to resolve existing problems in the runtime. Emits threadprivate
1533   /// variables to store the size of the VLAs/array sections for
1534   /// initializer/combiner/finalizer functions.
1535   /// \param RCG Allows reusing existing data for the reductions.
1536   /// \param N Reduction item for which fixups must be emitted.
1537   virtual void emitTaskReductionFixups(CodeGenFunction &CGF, SourceLocation Loc,
1538                                        ReductionCodeGen &RCG, unsigned N);
1539 
1540   /// Get the address of `void *` type of the private copy of the reduction
1541   /// item specified by the \p SharedLVal.
1542   /// \param ReductionsPtr Pointer to the reduction data returned by the
1543   /// emitTaskReductionInit function.
1544   /// \param SharedLVal Address of the original reduction item.
1545   virtual Address getTaskReductionItem(CodeGenFunction &CGF, SourceLocation Loc,
1546                                        llvm::Value *ReductionsPtr,
1547                                        LValue SharedLVal);
1548 
1549   /// Emit code for the 'taskwait' directive.
1550   virtual void emitTaskwaitCall(CodeGenFunction &CGF, SourceLocation Loc,
1551                                 const OMPTaskDataTy &Data);
1552 
1553   /// Emit code for the 'cancellation point' construct.
1554   /// \param CancelRegion Region kind for which the cancellation point must be
1555   /// emitted.
1556   ///
1557   virtual void emitCancellationPointCall(CodeGenFunction &CGF,
1558                                          SourceLocation Loc,
1559                                          OpenMPDirectiveKind CancelRegion);
1560 
1561   /// Emit code for the 'cancel' construct.
1562   /// \param IfCond Condition in the associated 'if' clause, if it was
1563   /// specified, nullptr otherwise.
1564   /// \param CancelRegion Region kind for which the cancel must be emitted.
1565   ///
1566   virtual void emitCancelCall(CodeGenFunction &CGF, SourceLocation Loc,
1567                               const Expr *IfCond,
1568                               OpenMPDirectiveKind CancelRegion);
1569 
1570   /// Emit outlined function for 'target' directive.
1571   /// \param D Directive to emit.
1572   /// \param ParentName Name of the function that encloses the target region.
1573   /// \param OutlinedFn Outlined function value to be defined by this call.
1574   /// \param OutlinedFnID Outlined function ID value to be defined by this call.
1575   /// \param IsOffloadEntry True if the outlined function is an offload entry.
1576   /// An outlined function may not be an entry if, e.g. the if clause always
1577   /// evaluates to false.
1578   /// \param CodeGen Code generation sequence for the \a D directive.
1579   virtual void emitTargetOutlinedFunction(const OMPExecutableDirective &D,
1580                                           StringRef ParentName,
1581                                           llvm::Function *&OutlinedFn,
1582                                           llvm::Constant *&OutlinedFnID,
1583                                           bool IsOffloadEntry,
1584                                           const RegionCodeGenTy &CodeGen);
1585 
1586   /// Emit the target offloading code associated with \a D. The emitted
1587   /// code attempts offloading the execution to the device; in the event of
1588   /// a failure it executes the host version outlined in \a OutlinedFn.
1589   /// \param D Directive to emit.
1590   /// \param OutlinedFn Host version of the code to be offloaded.
1591   /// \param OutlinedFnID ID of host version of the code to be offloaded.
1592   /// \param IfCond Expression evaluated in if clause associated with the target
1593   /// directive, or null if no if clause is used.
1594   /// \param Device Expression evaluated in device clause associated with the
1595   /// target directive (null if no device clause is used) and its modifier.
1596   /// \param SizeEmitter Callback to emit number of iterations for loop-based
1597   /// directives.
1598   virtual void emitTargetCall(
1599       CodeGenFunction &CGF, const OMPExecutableDirective &D,
1600       llvm::Function *OutlinedFn, llvm::Value *OutlinedFnID, const Expr *IfCond,
1601       llvm::PointerIntPair<const Expr *, 2, OpenMPDeviceClauseModifier> Device,
1602       llvm::function_ref<llvm::Value *(CodeGenFunction &CGF,
1603                                        const OMPLoopDirective &D)>
1604           SizeEmitter);
1605 
1606   /// Emit the target regions enclosed in the \a GD function definition or
1607   /// the function itself in case it is a valid device function. Returns true if
1608   /// \a GD was dealt with successfully.
1609   /// \param GD Function to scan.
1610   virtual bool emitTargetFunctions(GlobalDecl GD);
1611 
1612   /// Emit the global variable \a GD if it is a valid device global variable.
1613   /// Returns true if \a GD was dealt with successfully.
1614   /// \param GD Variable declaration to emit.
1615   virtual bool emitTargetGlobalVariable(GlobalDecl GD);
1616 
1617   /// Checks if the provided variable \a VD is a declare target variable and
1618   /// registers it when emitting code for the host.
1619   virtual void registerTargetGlobalVariable(const VarDecl *VD,
1620                                             llvm::Constant *Addr);
1621 
1622   /// Emit the global \a GD if it is meaningful for the target. Returns true
1623   /// if it was emitted successfully.
1624   /// \param GD Global to scan.
1625   virtual bool emitTargetGlobal(GlobalDecl GD);
1626 
1627   /// Creates and returns a registration function for when at least one
1628   /// requires directive was used in the current module.
1629   llvm::Function *emitRequiresDirectiveRegFun();
1630 
1631   /// Creates all the offload entries in the current compilation unit,
1632   /// along with their associated metadata.
1633   void createOffloadEntriesAndInfoMetadata();
1634 
1635   /// Emits code for teams call of the \a OutlinedFn with
1636   /// variables captured in a record whose address is stored in \a
1637   /// CapturedStruct.
1638   /// \param OutlinedFn Outlined function to be run by team masters. Type of
1639   /// this function is void(*)(kmp_int32 *, kmp_int32, struct context_vars*).
1640   /// \param CapturedVars A pointer to the record with the references to
1641   /// variables used in \a OutlinedFn function.
1642   ///
1643   virtual void emitTeamsCall(CodeGenFunction &CGF,
1644                              const OMPExecutableDirective &D,
1645                              SourceLocation Loc, llvm::Function *OutlinedFn,
1646                              ArrayRef<llvm::Value *> CapturedVars);
1647 
1648   /// Emits a call to void __kmpc_push_num_teams(ident_t *loc, kmp_int32
1649   /// global_tid, kmp_int32 num_teams, kmp_int32 thread_limit) to generate code
1650   /// for the num_teams clause.
1651   /// \param NumTeams An integer expression of teams.
1652   /// \param ThreadLimit An integer expression of threads.
1653   virtual void emitNumTeamsClause(CodeGenFunction &CGF, const Expr *NumTeams,
1654                                   const Expr *ThreadLimit, SourceLocation Loc);
1655 
1656   /// Struct that keeps all the relevant information that should be kept
1657   /// throughout a 'target data' region.
1658   class TargetDataInfo {
1659     /// Set to true if device pointer information have to be obtained.
1660     bool RequiresDevicePointerInfo = false;
1661     /// Set to true if Clang emits separate runtime calls for the beginning and
1662     /// end of the region.  These calls might have separate map type arrays.
1663     bool SeparateBeginEndCalls = false;
1664 
1665   public:
1666     /// The array of base pointer passed to the runtime library.
1667     llvm::Value *BasePointersArray = nullptr;
1668     /// The array of section pointers passed to the runtime library.
1669     llvm::Value *PointersArray = nullptr;
1670     /// The array of sizes passed to the runtime library.
1671     llvm::Value *SizesArray = nullptr;
1672     /// The array of map types passed to the runtime library for the beginning
1673     /// of the region or for the entire region if there are no separate map
1674     /// types for the region end.
1675     llvm::Value *MapTypesArray = nullptr;
1676     /// The array of map types passed to the runtime library for the end of the
1677     /// region, or nullptr if there are no separate map types for the region
1678     /// end.
1679     llvm::Value *MapTypesArrayEnd = nullptr;
1680     /// The array of user-defined mappers passed to the runtime library.
1681     llvm::Value *MappersArray = nullptr;
1682     /// The array of original declaration names of mapped pointers sent to the
1683     /// runtime library for debugging
1684     llvm::Value *MapNamesArray = nullptr;
1685     /// Indicate whether any user-defined mapper exists.
1686     bool HasMapper = false;
1687     /// The total number of pointers passed to the runtime library.
1688     unsigned NumberOfPtrs = 0u;
1689     /// Map between the a declaration of a capture and the corresponding base
1690     /// pointer address where the runtime returns the device pointers.
1691     llvm::DenseMap<const ValueDecl *, Address> CaptureDeviceAddrMap;
1692 
1693     explicit TargetDataInfo() {}
1694     explicit TargetDataInfo(bool RequiresDevicePointerInfo,
1695                             bool SeparateBeginEndCalls)
1696         : RequiresDevicePointerInfo(RequiresDevicePointerInfo),
1697           SeparateBeginEndCalls(SeparateBeginEndCalls) {}
1698     /// Clear information about the data arrays.
1699     void clearArrayInfo() {
1700       BasePointersArray = nullptr;
1701       PointersArray = nullptr;
1702       SizesArray = nullptr;
1703       MapTypesArray = nullptr;
1704       MapTypesArrayEnd = nullptr;
1705       MapNamesArray = nullptr;
1706       MappersArray = nullptr;
1707       HasMapper = false;
1708       NumberOfPtrs = 0u;
1709     }
1710     /// Return true if the current target data information has valid arrays.
1711     bool isValid() {
1712       return BasePointersArray && PointersArray && SizesArray &&
1713              MapTypesArray && (!HasMapper || MappersArray) && NumberOfPtrs;
1714     }
1715     bool requiresDevicePointerInfo() { return RequiresDevicePointerInfo; }
1716     bool separateBeginEndCalls() { return SeparateBeginEndCalls; }
1717   };
1718 
1719   /// Emit the target data mapping code associated with \a D.
1720   /// \param D Directive to emit.
1721   /// \param IfCond Expression evaluated in if clause associated with the
1722   /// target directive, or null if no if clause is used.
1723   /// \param Device Expression evaluated in device clause associated with the
1724   /// target directive, or null if no device clause is used.
1725   /// \param Info A record used to store information that needs to be preserved
1726   /// until the region is closed.
1727   virtual void emitTargetDataCalls(CodeGenFunction &CGF,
1728                                    const OMPExecutableDirective &D,
1729                                    const Expr *IfCond, const Expr *Device,
1730                                    const RegionCodeGenTy &CodeGen,
1731                                    TargetDataInfo &Info);
1732 
1733   /// Emit the data mapping/movement code associated with the directive
1734   /// \a D, which should be of the form 'target [{enter|exit} data | update]'.
1735   /// \param D Directive to emit.
1736   /// \param IfCond Expression evaluated in if clause associated with the target
1737   /// directive, or null if no if clause is used.
1738   /// \param Device Expression evaluated in device clause associated with the
1739   /// target directive, or null if no device clause is used.
1740   virtual void emitTargetDataStandAloneCall(CodeGenFunction &CGF,
1741                                             const OMPExecutableDirective &D,
1742                                             const Expr *IfCond,
1743                                             const Expr *Device);
1744 
1745   /// Marks function \a Fn with properly mangled versions of vector functions.
1746   /// \param FD Function declaration marked as 'declare simd'.
1747   /// \param Fn LLVM function that must be marked with 'declare simd'
1748   /// attributes.
1749   virtual void emitDeclareSimdFunction(const FunctionDecl *FD,
1750                                        llvm::Function *Fn);
1751 
1752   /// Emit initialization for doacross loop nesting support.
1753   /// \param D Loop-based construct used in the doacross nesting construct.
1754   virtual void emitDoacrossInit(CodeGenFunction &CGF, const OMPLoopDirective &D,
1755                                 ArrayRef<Expr *> NumIterations);
1756 
1757   /// Emit code for the doacross ordered directive with a 'depend' clause.
1758   /// \param C 'depend' clause with 'sink|source' dependency kind.
1759   virtual void emitDoacrossOrdered(CodeGenFunction &CGF,
1760                                    const OMPDependClause *C);
1761 
1762   /// Translates the native parameter of outlined function if this is required
1763   /// for target.
1764   /// \param FD Field decl from captured record for the parameter.
1765   /// \param NativeParam Parameter itself.
1766   virtual const VarDecl *translateParameter(const FieldDecl *FD,
1767                                             const VarDecl *NativeParam) const {
1768     return NativeParam; // Default: the parameter is returned untranslated.
1769   }
1770 
1771   /// Gets the address of the native argument based on the address of the
1772   /// target-specific parameter.
1773   /// \param NativeParam Parameter itself.
1774   /// \param TargetParam Corresponding target-specific parameter.
1775   virtual Address getParameterAddress(CodeGenFunction &CGF,
1776                                       const VarDecl *NativeParam,
1777                                       const VarDecl *TargetParam) const;
1778 
1779   /// Choose the default schedule type and chunk value for the
1780   /// dist_schedule clause. This default implementation is empty.
1781   virtual void getDefaultDistScheduleAndChunk(CodeGenFunction &CGF,
1782       const OMPLoopDirective &S, OpenMPDistScheduleClauseKind &ScheduleKind,
1783       llvm::Value *&Chunk) const {}
1784 
1785   /// Choose the default schedule type and chunk value for the
1786   /// schedule clause.
1787   virtual void getDefaultScheduleAndChunk(CodeGenFunction &CGF,
1788       const OMPLoopDirective &S, OpenMPScheduleClauseKind &ScheduleKind,
1789       const Expr *&ChunkExpr) const;
1790 
1791   /// Emits a call of the outlined function with the provided arguments,
1792   /// translating these arguments to the correct target-specific arguments.
1793   virtual void
1794   emitOutlinedFunctionCall(CodeGenFunction &CGF, SourceLocation Loc,
1795                            llvm::FunctionCallee OutlinedFn,
1796                            ArrayRef<llvm::Value *> Args = llvm::None) const;
1797 
1798   /// Emits the OpenMP-specific function prolog.
1799   /// Required for device constructs.
1800   virtual void emitFunctionProlog(CodeGenFunction &CGF, const Decl *D);
1801 
1802   /// Gets the OpenMP-specific address of the local variable \a VD.
1803   virtual Address getAddressOfLocalVariable(CodeGenFunction &CGF,
1804                                             const VarDecl *VD);
1805 
1806   /// Marks the declaration as already emitted for the device code and returns
1807   /// true if it was marked already, and false otherwise.
1808   bool markAsGlobalTarget(GlobalDecl GD);
1809 
1810   /// Emit declare target variables marked for deferred emission.
1811   void emitDeferredTargetDecls() const;
1812 
1813   /// Adjust some parameters for the target-based directives, e.g. addresses of
1814   /// the variables captured by reference in lambdas.
1815   virtual void
1816   adjustTargetSpecificDataForLambdas(CodeGenFunction &CGF,
1817                                      const OMPExecutableDirective &D) const;
1818 
1819   /// Perform a check on the requires decl to ensure that the target
1820   /// architecture supports unified addressing.
1821   virtual void processRequiresDirective(const OMPRequiresDecl *D);
1822 
1823   /// Gets the default memory ordering as specified in the requires directive.
1824   llvm::AtomicOrdering getDefaultMemoryOrdering() const;
1825 
1826   /// Checks if the variable has an associated OMPAllocateDeclAttr attribute
1827   /// with the predefined allocator and translates it into the corresponding
1828   /// address space.
1829   virtual bool hasAllocateAttributeForGlobalVar(const VarDecl *VD, LangAS &AS);
1830 
1831   /// Returns whether unified_shared_memory has been specified.
1832   bool hasRequiresUnifiedSharedMemory() const;
1833 
1834   /// Checks if the \p VD variable is marked as a nontemporal declaration in
1835   /// the current context.
1836   bool isNontemporalDecl(const ValueDecl *VD) const;
1837 
1838   /// Create a specialized alloca to handle lastprivate conditionals.
1839   Address emitLastprivateConditionalInit(CodeGenFunction &CGF,
1840                                          const VarDecl *VD);
1841 
1842   /// Checks if the provided \p LHS is lastprivate conditional and emits the
1843   /// code to update the value of the original variable.
1844   /// \code
1845   /// lastprivate(conditional: a)
1846   /// ...
1847   /// <type> a;
1848   /// lp_a = ...;
1849   /// #pragma omp critical(a)
1850   /// if (last_iv_a <= iv) {
1851   ///   last_iv_a = iv;
1852   ///   global_a = lp_a;
1853   /// }
1854   /// \endcode
1855   virtual void checkAndEmitLastprivateConditional(CodeGenFunction &CGF,
1856                                                   const Expr *LHS);
1857 
1858   /// Checks if the lastprivate conditional was updated in an inner region and
1859   /// writes the value.
1860   /// \code
1861   /// lastprivate(conditional: a)
1862   /// ...
1863   /// <type> a; bool Fired = false;
1864   /// #pragma omp ... shared(a)
1865   /// {
1866   ///   lp_a = ...;
1867   ///   Fired = true;
1868   /// }
1869   /// if (Fired) {
1870   ///   #pragma omp critical(a)
1871   ///   if (last_iv_a <= iv) {
1872   ///     last_iv_a = iv;
1873   ///     global_a = lp_a;
1874   ///   }
1875   ///   Fired = false;
1876   /// }
1877   /// \endcode
1878   virtual void checkAndEmitSharedLastprivateConditional(
1879       CodeGenFunction &CGF, const OMPExecutableDirective &D,
1880       const llvm::DenseSet<CanonicalDeclPtr<const VarDecl>> &IgnoredDecls);
1881 
1882   /// Gets the address of the global copy used for lastprivate conditional
1883   /// update, if any. NOTE(review): declared void; confirm this summary.
1884   /// \param PrivLVal LValue for the private copy.
1885   /// \param VD Original lastprivate declaration.
1886   virtual void emitLastprivateConditionalFinalUpdate(CodeGenFunction &CGF,
1887                                                      LValue PrivLVal,
1888                                                      const VarDecl *VD,
1889                                                      SourceLocation Loc);
1890 
1891   /// Emits the list of dependencies based on the provided data (array of
1892   /// dependence/expression pairs).
1893   /// \returns Pointer to the first element of the array cast to VoidPtr type.
1894   std::pair<llvm::Value *, Address>
1895   emitDependClause(CodeGenFunction &CGF,
1896                    ArrayRef<OMPTaskDataTy::DependData> Dependencies,
1897                    SourceLocation Loc);
1898 
1899   /// Emits the list of dependencies based on the provided data (array of
1900   /// dependence/expression pairs) for the depobj construct. In this case, the
1901   /// variable is allocated dynamically. \returns Pointer to the first
1902   /// element of the array cast to VoidPtr type.
1903   Address emitDepobjDependClause(CodeGenFunction &CGF,
1904                                  const OMPTaskDataTy::DependData &Dependencies,
1905                                  SourceLocation Loc);
1906 
1907   /// Emits the code to destroy the dependency object provided in depobj
1908   /// directive.
1909   void emitDestroyClause(CodeGenFunction &CGF, LValue DepobjLVal,
1910                          SourceLocation Loc);
1911 
1912   /// Updates the dependency kind in the specified depobj object.
1913   /// \param DepobjLVal LValue for the main depobj object.
1914   /// \param NewDepKind New dependency kind.
1915   void emitUpdateClause(CodeGenFunction &CGF, LValue DepobjLVal,
1916                         OpenMPDependClauseKind NewDepKind, SourceLocation Loc);
1917 
1918   /// Initializes user defined allocators specified in the uses_allocators
1919   /// clauses.
1920   void emitUsesAllocatorsInit(CodeGenFunction &CGF, const Expr *Allocator,
1921                               const Expr *AllocatorTraits);
1922 
1923   /// Destroys user defined allocators specified in the uses_allocators clause.
1924   void emitUsesAllocatorsFini(CodeGenFunction &CGF, const Expr *Allocator);
1925 
1926   /// Returns true if the variable is a local variable in untied task.
1927   bool isLocalVarInUntiedTask(CodeGenFunction &CGF, const VarDecl *VD) const;
1928 };
1929 
1930 /// Class supports emission of SIMD-only code.
1931 class CGOpenMPSIMDRuntime final : public CGOpenMPRuntime {
1932 public:
1933   explicit CGOpenMPSIMDRuntime(CodeGenModule &CGM) : CGOpenMPRuntime(CGM) {}
1934   ~CGOpenMPSIMDRuntime() override {}
1935 
1936   /// Emits outlined function for the specified OpenMP parallel directive
1937   /// \a D. This outlined function has type void(*)(kmp_int32 *ThreadID,
1938   /// kmp_int32 BoundID, struct context_vars*).
1939   /// \param D OpenMP directive.
1940   /// \param ThreadIDVar Variable for thread id in the current OpenMP region.
1941   /// \param InnermostKind Kind of innermost directive (for simple directives it
1942   /// is a directive itself, for combined - its innermost directive).
1943   /// \param CodeGen Code generation sequence for the \a D directive.
1944   llvm::Function *
1945   emitParallelOutlinedFunction(const OMPExecutableDirective &D,
1946                                const VarDecl *ThreadIDVar,
1947                                OpenMPDirectiveKind InnermostKind,
1948                                const RegionCodeGenTy &CodeGen) override;
1949 
1950   /// Emits outlined function for the specified OpenMP teams directive
1951   /// \a D. This outlined function has type void(*)(kmp_int32 *ThreadID,
1952   /// kmp_int32 BoundID, struct context_vars*).
1953   /// \param D OpenMP directive.
1954   /// \param ThreadIDVar Variable for thread id in the current OpenMP region.
1955   /// \param InnermostKind Kind of innermost directive (for simple directives it
1956   /// is a directive itself, for combined - its innermost directive).
1957   /// \param CodeGen Code generation sequence for the \a D directive.
1958   llvm::Function *
1959   emitTeamsOutlinedFunction(const OMPExecutableDirective &D,
1960                             const VarDecl *ThreadIDVar,
1961                             OpenMPDirectiveKind InnermostKind,
1962                             const RegionCodeGenTy &CodeGen) override;
1963 
1964   /// Emits outlined function for the OpenMP task directive \a D. This
1965   /// outlined function has type void(*)(kmp_int32 ThreadID, struct task_t*
1966   /// TaskT).
1967   /// \param D OpenMP directive.
1968   /// \param ThreadIDVar Variable for thread id in the current OpenMP region.
1969   /// \param PartIDVar Variable for partition id in the current OpenMP untied
1970   /// task region.
1971   /// \param TaskTVar Variable for task_t argument.
1972   /// \param InnermostKind Kind of innermost directive (for simple directives it
1973   /// is a directive itself, for combined - its innermost directive).
1974   /// \param CodeGen Code generation sequence for the \a D directive.
1975   /// \param Tied true if task is generated for tied task, false otherwise.
1976   /// \param NumberOfParts Number of parts in untied task. Ignored for tied
1977   /// tasks.
1978   ///
1979   llvm::Function *emitTaskOutlinedFunction(
1980       const OMPExecutableDirective &D, const VarDecl *ThreadIDVar,
1981       const VarDecl *PartIDVar, const VarDecl *TaskTVar,
1982       OpenMPDirectiveKind InnermostKind, const RegionCodeGenTy &CodeGen,
1983       bool Tied, unsigned &NumberOfParts) override;
1984 
1985   /// Emits code for parallel or serial call of the \a OutlinedFn with
1986   /// variables captured in a record which address is stored in \a
1987   /// CapturedStruct.
1988   /// \param OutlinedFn Outlined function to be run in parallel threads. Type of
1989   /// this function is void(*)(kmp_int32 *, kmp_int32, struct context_vars*).
1990   /// \param CapturedVars A pointer to the record with the references to
1991   /// variables used in \a OutlinedFn function.
1992   /// \param IfCond Condition in the associated 'if' clause, if it was
1993   /// specified, nullptr otherwise.
1994   ///
1995   void emitParallelCall(CodeGenFunction &CGF, SourceLocation Loc,
1996                         llvm::Function *OutlinedFn,
1997                         ArrayRef<llvm::Value *> CapturedVars,
1998                         const Expr *IfCond) override;
1999 
2000   /// Emits a critical region.
2001   /// \param CriticalName Name of the critical region.
2002   /// \param CriticalOpGen Generator for the statement associated with the given
2003   /// critical region.
2004   /// \param Hint Value of the 'hint' clause (optional).
2005   void emitCriticalRegion(CodeGenFunction &CGF, StringRef CriticalName,
2006                           const RegionCodeGenTy &CriticalOpGen,
2007                           SourceLocation Loc,
2008                           const Expr *Hint = nullptr) override;
2009 
2010   /// Emits a master region.
2011   /// \param MasterOpGen Generator for the statement associated with the given
2012   /// master region.
2013   void emitMasterRegion(CodeGenFunction &CGF,
2014                         const RegionCodeGenTy &MasterOpGen,
2015                         SourceLocation Loc) override;
2016 
2017   /// Emits a masked region.
2018   /// \param MaskedOpGen Generator for the statement associated with the given
2019   /// masked region.
2020   void emitMaskedRegion(CodeGenFunction &CGF,
2021                         const RegionCodeGenTy &MaskedOpGen, SourceLocation Loc,
2022                         const Expr *Filter = nullptr) override;
2023 
2024   // (Stray duplicate, no declaration follows.) Emits a masked region.
2025   // \param MaskedOpGen Generator for the statement associated with the given
2026   // masked region.
2027 
2028   /// Emits code for a taskyield directive.
2029   void emitTaskyieldCall(CodeGenFunction &CGF, SourceLocation Loc) override;
2030 
2031   /// Emit a taskgroup region.
2032   /// \param TaskgroupOpGen Generator for the statement associated with the
2033   /// given taskgroup region.
2034   void emitTaskgroupRegion(CodeGenFunction &CGF,
2035                            const RegionCodeGenTy &TaskgroupOpGen,
2036                            SourceLocation Loc) override;
2037 
2038   /// Emits a single region.
2039   /// \param SingleOpGen Generator for the statement associated with the given
2040   /// single region.
2041   void emitSingleRegion(CodeGenFunction &CGF,
2042                         const RegionCodeGenTy &SingleOpGen, SourceLocation Loc,
2043                         ArrayRef<const Expr *> CopyprivateVars,
2044                         ArrayRef<const Expr *> DestExprs,
2045                         ArrayRef<const Expr *> SrcExprs,
2046                         ArrayRef<const Expr *> AssignmentOps) override;
2047 
2048   /// Emit an ordered region.
2049   /// \param OrderedOpGen Generator for the statement associated with the given
2050   /// ordered region.
2051   void emitOrderedRegion(CodeGenFunction &CGF,
2052                          const RegionCodeGenTy &OrderedOpGen,
2053                          SourceLocation Loc, bool IsThreads) override;
2054 
2055   /// Emit an implicit/explicit barrier for OpenMP threads.
2056   /// \param Kind Directive for which this implicit barrier call must be
2057   /// generated. Must be OMPD_barrier for explicit barrier generation.
2058   /// \param EmitChecks true if need to emit checks for cancellation barriers.
2059   /// \param ForceSimpleCall true if simple barrier call must be emitted, false
2060   /// if runtime class decides which one to emit (simple or with cancellation
2061   /// checks).
2062   ///
2063   void emitBarrierCall(CodeGenFunction &CGF, SourceLocation Loc,
2064                        OpenMPDirectiveKind Kind, bool EmitChecks = true,
2065                        bool ForceSimpleCall = false) override;
2066 
2067   /// This is used for non static scheduled types and when the ordered
2068   /// clause is present on the loop construct.
2069   /// Depending on the loop schedule, it is necessary to call some runtime
2070   /// routine before start of the OpenMP loop to get the loop upper / lower
2071   /// bounds \a LB and \a UB and stride \a ST.
2072   ///
2073   /// \param CGF Reference to current CodeGenFunction.
2074   /// \param Loc Clang source location.
2075   /// \param ScheduleKind Schedule kind, specified by the 'schedule' clause.
2076   /// \param IVSize Size of the iteration variable in bits.
2077   /// \param IVSigned Sign of the iteration variable.
2078   /// \param Ordered true if loop is ordered, false otherwise.
2079   /// \param DispatchValues struct containing llvm values for lower bound, upper
2080   /// bound, and chunk expression.
2081   /// For the default (nullptr) value, the chunk 1 will be used.
2082   ///
2083   void emitForDispatchInit(CodeGenFunction &CGF, SourceLocation Loc,
2084                            const OpenMPScheduleTy &ScheduleKind,
2085                            unsigned IVSize, bool IVSigned, bool Ordered,
2086                            const DispatchRTInput &DispatchValues) override;
2087 
2088   /// Call the appropriate runtime routine to initialize it before start
2089   /// of loop.
2090   ///
2091   /// This is used only in case of static schedule, when the user did not
2092   /// specify an ordered clause on the loop construct.
2093   /// Depending on the loop schedule, it is necessary to call some runtime
2094   /// routine before start of the OpenMP loop to get the loop upper / lower
2095   /// bounds LB and UB and stride ST.
2096   ///
2097   /// \param CGF Reference to current CodeGenFunction.
2098   /// \param Loc Clang source location.
2099   /// \param DKind Kind of the directive.
2100   /// \param ScheduleKind Schedule kind, specified by the 'schedule' clause.
2101   /// \param Values Input arguments for the construct.
2102   ///
2103   void emitForStaticInit(CodeGenFunction &CGF, SourceLocation Loc,
2104                          OpenMPDirectiveKind DKind,
2105                          const OpenMPScheduleTy &ScheduleKind,
2106                          const StaticRTInput &Values) override;
2107 
2108   /// Emits the static-schedule initialization for a 'distribute' construct.
2109   /// \param CGF Reference to current CodeGenFunction.
2110   /// \param Loc Clang source location.
2111   /// \param SchedKind Schedule kind, specified by the 'dist_schedule' clause.
2112   /// \param Values Input arguments for the construct.
2113   ///
2114   void emitDistributeStaticInit(CodeGenFunction &CGF, SourceLocation Loc,
2115                                 OpenMPDistScheduleClauseKind SchedKind,
2116                                 const StaticRTInput &Values) override;
2117 
2118   /// Call the appropriate runtime routine to notify that we finished
2119   /// iteration of the ordered loop with the dynamic scheduling.
2120   ///
2121   /// \param CGF Reference to current CodeGenFunction.
2122   /// \param Loc Clang source location.
2123   /// \param IVSize Size of the iteration variable in bits.
2124   /// \param IVSigned Sign of the iteration variable.
2125   ///
2126   void emitForOrderedIterationEnd(CodeGenFunction &CGF, SourceLocation Loc,
2127                                   unsigned IVSize, bool IVSigned) override;
2128 
2129   /// Call the appropriate runtime routine to notify that we finished
2130   /// all the work with current loop.
2131   ///
2132   /// \param CGF Reference to current CodeGenFunction.
2133   /// \param Loc Clang source location.
2134   /// \param DKind Kind of the directive for which the static finish is emitted.
2135   ///
2136   void emitForStaticFinish(CodeGenFunction &CGF, SourceLocation Loc,
2137                            OpenMPDirectiveKind DKind) override;
2138 
2139   /// Call __kmpc_dispatch_next(
2140   ///          ident_t *loc, kmp_int32 tid, kmp_int32 *p_lastiter,
2141   ///          kmp_int[32|64] *p_lower, kmp_int[32|64] *p_upper,
2142   ///          kmp_int[32|64] *p_stride);
2143   /// \param IVSize Size of the iteration variable in bits.
2144   /// \param IVSigned Sign of the iteration variable.
2145   /// \param IL Address of the output variable in which the flag of the
2146   /// last iteration is returned.
2147   /// \param LB Address of the output variable in which the lower iteration
2148   /// number is returned.
2149   /// \param UB Address of the output variable in which the upper iteration
2150   /// number is returned.
2151   /// \param ST Address of the output variable in which the stride value is
2152   /// returned.
2153   llvm::Value *emitForNext(CodeGenFunction &CGF, SourceLocation Loc,
2154                            unsigned IVSize, bool IVSigned, Address IL,
2155                            Address LB, Address UB, Address ST) override;
2156 
2157   /// Emits call to void __kmpc_push_num_threads(ident_t *loc, kmp_int32
2158   /// global_tid, kmp_int32 num_threads) to generate code for 'num_threads'
2159   /// clause.
2160   /// \param NumThreads An integer value of threads.
2161   void emitNumThreadsClause(CodeGenFunction &CGF, llvm::Value *NumThreads,
2162                             SourceLocation Loc) override;
2163 
2164   /// Emit call to void __kmpc_push_proc_bind(ident_t *loc, kmp_int32
2165   /// global_tid, int proc_bind) to generate code for 'proc_bind' clause.
2166   void emitProcBindClause(CodeGenFunction &CGF,
2167                           llvm::omp::ProcBindKind ProcBind,
2168                           SourceLocation Loc) override;
2169 
2170   /// Returns address of the threadprivate variable for the current
2171   /// thread.
2172   /// \param VD Threadprivate variable.
2173   /// \param VDAddr Address of the global variable \a VD.
2174   /// \param Loc Location of the reference to threadprivate var.
2175   /// \return Address of the threadprivate variable for the current thread.
2176   Address getAddrOfThreadPrivate(CodeGenFunction &CGF, const VarDecl *VD,
2177                                  Address VDAddr, SourceLocation Loc) override;
2178 
2179   /// Emit a code for initialization of threadprivate variable. It emits
2180   /// a call to runtime library which adds initial value to the newly created
2181   /// threadprivate variable (if it is not constant) and registers destructor
2182   /// for the variable (if any).
2183   /// \param VD Threadprivate variable.
2184   /// \param VDAddr Address of the global variable \a VD.
2185   /// \param Loc Location of threadprivate declaration.
2186   /// \param PerformInit true if initialization expression is not constant.
2187   llvm::Function *
2188   emitThreadPrivateVarDefinition(const VarDecl *VD, Address VDAddr,
2189                                  SourceLocation Loc, bool PerformInit,
2190                                  CodeGenFunction *CGF = nullptr) override;
2191 
2192   /// Creates artificial threadprivate variable with name \p Name and type \p
2193   /// VarType.
2194   /// \param VarType Type of the artificial threadprivate variable.
2195   /// \param Name Name of the artificial threadprivate variable.
2196   Address getAddrOfArtificialThreadPrivate(CodeGenFunction &CGF,
2197                                            QualType VarType,
2198                                            StringRef Name) override;
2199 
2200   /// Emit flush of the variables specified in 'omp flush' directive.
2201   /// \param Vars List of variables to flush.
2202   void emitFlush(CodeGenFunction &CGF, ArrayRef<const Expr *> Vars,
2203                  SourceLocation Loc, llvm::AtomicOrdering AO) override;
2204 
2205   /// Emit task region for the task directive. The task region is
2206   /// emitted in several steps:
2207   /// 1. Emit a call to kmp_task_t *__kmpc_omp_task_alloc(ident_t *, kmp_int32
2208   /// gtid, kmp_int32 flags, size_t sizeof_kmp_task_t, size_t sizeof_shareds,
2209   /// kmp_routine_entry_t *task_entry). Here task_entry is a pointer to the
2210   /// function:
2211   /// kmp_int32 .omp_task_entry.(kmp_int32 gtid, kmp_task_t *tt) {
2212   ///   TaskFunction(gtid, tt->part_id, tt->shareds);
2213   ///   return 0;
2214   /// }
2215   /// 2. Copy a list of shared variables to field shareds of the resulting
2216   /// structure kmp_task_t returned by the previous call (if any).
2217   /// 3. Copy a pointer to destructions function to field destructions of the
2218   /// resulting structure kmp_task_t.
2219   /// 4. Emit a call to kmp_int32 __kmpc_omp_task(ident_t *, kmp_int32 gtid,
2220   /// kmp_task_t *new_task), where new_task is a resulting structure from
2221   /// previous items.
2222   /// \param D Current task directive.
2223   /// \param TaskFunction An LLVM function with type void (*)(i32 /*gtid*/, i32
2224   /// /*part_id*/, captured_struct */*__context*/);
2225   /// \param SharedsTy A type which contains references to the shared variables.
2226   /// \param Shareds Context with the list of shared variables from the \p
2227   /// TaskFunction.
2228   /// \param IfCond Not a nullptr if 'if' clause was specified, nullptr
2229   /// otherwise.
2230   /// \param Data Additional data for task generation like tiedness, final
2231   /// state, list of privates etc.
2232   void emitTaskCall(CodeGenFunction &CGF, SourceLocation Loc,
2233                     const OMPExecutableDirective &D,
2234                     llvm::Function *TaskFunction, QualType SharedsTy,
2235                     Address Shareds, const Expr *IfCond,
2236                     const OMPTaskDataTy &Data) override;
2237 
2238   /// Emit task region for the taskloop directive. The taskloop region is
2239   /// emitted in several steps:
2240   /// 1. Emit a call to kmp_task_t *__kmpc_omp_task_alloc(ident_t *, kmp_int32
2241   /// gtid, kmp_int32 flags, size_t sizeof_kmp_task_t, size_t sizeof_shareds,
2242   /// kmp_routine_entry_t *task_entry). Here task_entry is a pointer to the
2243   /// function:
2244   /// kmp_int32 .omp_task_entry.(kmp_int32 gtid, kmp_task_t *tt) {
2245   ///   TaskFunction(gtid, tt->part_id, tt->shareds);
2246   ///   return 0;
2247   /// }
2248   /// 2. Copy a list of shared variables to field shareds of the resulting
2249   /// structure kmp_task_t returned by the previous call (if any).
2250   /// 3. Copy a pointer to destructions function to field destructions of the
2251   /// resulting structure kmp_task_t.
2252   /// 4. Emit a call to void __kmpc_taskloop(ident_t *loc, int gtid, kmp_task_t
2253   /// *task, int if_val, kmp_uint64 *lb, kmp_uint64 *ub, kmp_int64 st, int
2254   /// nogroup, int sched, kmp_uint64 grainsize, void *task_dup ), where task
2255   /// is a resulting structure from
2256   /// previous items.
2257   /// \param D Current task directive.
2258   /// \param TaskFunction An LLVM function with type void (*)(i32 /*gtid*/, i32
2259   /// /*part_id*/, captured_struct */*__context*/);
2260   /// \param SharedsTy A type which contains references to the shared variables.
2261   /// \param Shareds Context with the list of shared variables from the \p
2262   /// TaskFunction.
2263   /// \param IfCond Not a nullptr if 'if' clause was specified, nullptr
2264   /// otherwise.
2265   /// \param Data Additional data for task generation like tiedness, final
2266   /// state, list of privates etc.
2267   void emitTaskLoopCall(CodeGenFunction &CGF, SourceLocation Loc,
2268                         const OMPLoopDirective &D, llvm::Function *TaskFunction,
2269                         QualType SharedsTy, Address Shareds, const Expr *IfCond,
2270                         const OMPTaskDataTy &Data) override;
2271 
2272   /// Emit a code for reduction clause. Next code should be emitted for
2273   /// reduction:
2274   /// \code
2275   ///
2276   /// static kmp_critical_name lock = { 0 };
2277   ///
2278   /// void reduce_func(void *lhs[<n>], void *rhs[<n>]) {
2279   ///  ...
2280   ///  *(Type<i>*)lhs[i] = RedOp<i>(*(Type<i>*)lhs[i], *(Type<i>*)rhs[i]);
2281   ///  ...
2282   /// }
2283   ///
2284   /// ...
2285   /// void *RedList[<n>] = {&<RHSExprs>[0], ..., &<RHSExprs>[<n>-1]};
2286   /// switch (__kmpc_reduce{_nowait}(<loc>, <gtid>, <n>, sizeof(RedList),
2287   /// RedList, reduce_func, &<lock>)) {
2288   /// case 1:
2289   ///  ...
2290   ///  <LHSExprs>[i] = RedOp<i>(*<LHSExprs>[i], *<RHSExprs>[i]);
2291   ///  ...
2292   /// __kmpc_end_reduce{_nowait}(<loc>, <gtid>, &<lock>);
2293   /// break;
2294   /// case 2:
2295   ///  ...
2296   ///  Atomic(<LHSExprs>[i] = RedOp<i>(*<LHSExprs>[i], *<RHSExprs>[i]));
2297   ///  ...
2298   /// break;
2299   /// default:;
2300   /// }
2301   /// \endcode
2302   ///
2303   /// \param Privates List of private copies for original reduction arguments.
2304   /// \param LHSExprs List of LHS in \a ReductionOps reduction operations.
2305   /// \param RHSExprs List of RHS in \a ReductionOps reduction operations.
2306   /// \param ReductionOps List of reduction operations in form 'LHS binop RHS'
2307   /// or 'operator binop(LHS, RHS)'.
2308   /// \param Options List of options for reduction codegen:
2309   ///     WithNowait true if parent directive has also nowait clause, false
2310   ///     otherwise.
2311   ///     SimpleReduction Emit reduction operation only. Used for omp simd
2312   ///     directive on the host.
2313   ///     ReductionKind The kind of reduction to perform.
2314   void emitReduction(CodeGenFunction &CGF, SourceLocation Loc,
2315                      ArrayRef<const Expr *> Privates,
2316                      ArrayRef<const Expr *> LHSExprs,
2317                      ArrayRef<const Expr *> RHSExprs,
2318                      ArrayRef<const Expr *> ReductionOps,
2319                      ReductionOptionsTy Options) override;
2320 
2321   /// Emit a code for initialization of task reduction clause. Next code
2322   /// should be emitted for reduction:
2323   /// \code
2324   ///
2325   /// _taskred_item_t red_data[n];
2326   /// ...
2327   /// red_data[i].shar = &shareds[i];
2328   /// red_data[i].orig = &origs[i];
2329   /// red_data[i].size = sizeof(origs[i]);
2330   /// red_data[i].f_init = (void*)RedInit<i>;
2331   /// red_data[i].f_fini = (void*)RedDest<i>;
2332   /// red_data[i].f_comb = (void*)RedOp<i>;
2333   /// red_data[i].flags = <Flag_i>;
2334   /// ...
2335   /// void* tg1 = __kmpc_taskred_init(gtid, n, red_data);
2336   /// \endcode
2337   /// For reduction clause with task modifier it emits the next call:
2338   /// \code
2339   ///
2340   /// _taskred_item_t red_data[n];
2341   /// ...
2342   /// red_data[i].shar = &shareds[i];
2343   /// red_data[i].orig = &origs[i];
2344   /// red_data[i].size = sizeof(origs[i]);
2345   /// red_data[i].f_init = (void*)RedInit<i>;
2346   /// red_data[i].f_fini = (void*)RedDest<i>;
2347   /// red_data[i].f_comb = (void*)RedOp<i>;
2348   /// red_data[i].flags = <Flag_i>;
2349   /// ...
2350   /// void* tg1 = __kmpc_taskred_modifier_init(loc, gtid, is_worksharing, n,
2351   /// red_data);
2352   /// \endcode
2353   /// \param LHSExprs List of LHS in \a Data.ReductionOps reduction operations.
2354   /// \param RHSExprs List of RHS in \a Data.ReductionOps reduction operations.
2355   /// \param Data Additional data for task generation like tiedness, final
2356   /// state, list of privates, reductions etc.
2357   llvm::Value *emitTaskReductionInit(CodeGenFunction &CGF, SourceLocation Loc,
2358                                      ArrayRef<const Expr *> LHSExprs,
2359                                      ArrayRef<const Expr *> RHSExprs,
2360                                      const OMPTaskDataTy &Data) override;
2361 
2362   /// Emits the following code for reduction clause with task modifier:
2363   /// \code
2364   /// __kmpc_task_reduction_modifier_fini(loc, gtid, is_worksharing);
2365   /// \endcode
2366   void emitTaskReductionFini(CodeGenFunction &CGF, SourceLocation Loc,
2367                              bool IsWorksharingReduction) override;
2368 
2369   /// Required to resolve existing problems in the runtime. Emits threadprivate
2370   /// variables to store the size of the VLAs/array sections for
2371   /// initializer/combiner/finalizer functions + emits threadprivate variable to
2372   /// store the pointer to the original reduction item for the custom
2373   /// initializer defined by declare reduction construct.
2374   /// \param RCG Allows reusing existing data for the reductions.
2375   /// \param N Reduction item for which fixups must be emitted.
2376   void emitTaskReductionFixups(CodeGenFunction &CGF, SourceLocation Loc,
2377                                ReductionCodeGen &RCG, unsigned N) override;
2378 
2379   /// Get the address of `void *` type of the private copy of the reduction
2380   /// item specified by the \p SharedLVal.
2381   /// \param ReductionsPtr Pointer to the reduction data returned by the
2382   /// emitTaskReductionInit function.
2383   /// \param SharedLVal Address of the original reduction item.
2384   Address getTaskReductionItem(CodeGenFunction &CGF, SourceLocation Loc,
2385                                llvm::Value *ReductionsPtr,
2386                                LValue SharedLVal) override;
2387 
2388   /// Emit code for 'taskwait' directive.
2389   void emitTaskwaitCall(CodeGenFunction &CGF, SourceLocation Loc,
2390                         const OMPTaskDataTy &Data) override;
2391 
2392   /// Emit code for 'cancellation point' construct.
2393   /// \param CancelRegion Region kind for which the cancellation point must be
2394   /// emitted.
2395   ///
2396   void emitCancellationPointCall(CodeGenFunction &CGF, SourceLocation Loc,
2397                                  OpenMPDirectiveKind CancelRegion) override;
2398 
2399   /// Emit code for 'cancel' construct.
2400   /// \param IfCond Condition in the associated 'if' clause, if it was
2401   /// specified, nullptr otherwise.
2402   /// \param CancelRegion Region kind for which the cancel must be emitted.
2403   ///
2404   void emitCancelCall(CodeGenFunction &CGF, SourceLocation Loc,
2405                       const Expr *IfCond,
2406                       OpenMPDirectiveKind CancelRegion) override;
2407 
2408   /// Emit outlined function for 'target' directive.
2409   /// \param D Directive to emit.
2410   /// \param ParentName Name of the function that encloses the target region.
2411   /// \param OutlinedFn Outlined function value to be defined by this call.
2412   /// \param OutlinedFnID Outlined function ID value to be defined by this call.
2413   /// \param IsOffloadEntry True if the outlined function is an offload entry.
2414   /// An outlined function may not be an entry if, e.g. the if clause always
2415   /// evaluates to false.
2416   /// \param CodeGen Code generation sequence for the \a D directive.
2417   void emitTargetOutlinedFunction(const OMPExecutableDirective &D,
2418                                   StringRef ParentName,
2419                                   llvm::Function *&OutlinedFn,
2420                                   llvm::Constant *&OutlinedFnID,
2421                                   bool IsOffloadEntry,
2422                                   const RegionCodeGenTy &CodeGen) override;
2423 
2424   /// Emit the target offloading code associated with \a D. The emitted
2425   /// code attempts offloading the execution to the device, in the event of
2426   /// a failure it executes the host version outlined in \a OutlinedFn.
2427   /// \param D Directive to emit.
2428   /// \param OutlinedFn Host version of the code to be offloaded.
2429   /// \param OutlinedFnID ID of host version of the code to be offloaded.
2430   /// \param IfCond Expression evaluated in if clause associated with the target
2431   /// directive, or null if no if clause is used.
2432   /// \param Device Expression evaluated in device clause associated with the
2433   /// target directive (null if no device clause is used) and device modifier.
2434   void emitTargetCall(
2435       CodeGenFunction &CGF, const OMPExecutableDirective &D,
2436       llvm::Function *OutlinedFn, llvm::Value *OutlinedFnID, const Expr *IfCond,
2437       llvm::PointerIntPair<const Expr *, 2, OpenMPDeviceClauseModifier> Device,
2438       llvm::function_ref<llvm::Value *(CodeGenFunction &CGF,
2439                                        const OMPLoopDirective &D)>
2440           SizeEmitter) override;
2441 
2442   /// Emit the target regions enclosed in \a GD function definition or
2443   /// the function itself in case it is a valid device function. Returns true if
2444   /// \a GD was dealt with successfully.
2445   /// \param GD Function to scan.
2446   bool emitTargetFunctions(GlobalDecl GD) override;
2447 
2448   /// Emit the global variable if it is a valid device global variable.
2449   /// Returns true if \a GD was dealt with successfully.
2450   /// \param GD Variable declaration to emit.
2451   bool emitTargetGlobalVariable(GlobalDecl GD) override;
2452 
2453   /// Emit the global \a GD if it is meaningful for the target. Returns
2454   /// true if it was emitted successfully.
2455   /// \param GD Global to scan.
2456   bool emitTargetGlobal(GlobalDecl GD) override;
2457 
2458   /// Emits code for teams call of the \a OutlinedFn with
2459   /// variables captured in a record which address is stored in \a
2460   /// CapturedStruct.
2461   /// \param OutlinedFn Outlined function to be run by team masters. Type of
2462   /// this function is void(*)(kmp_int32 *, kmp_int32, struct context_vars*).
2463   /// \param CapturedVars A pointer to the record with the references to
2464   /// variables used in \a OutlinedFn function.
2465   ///
2466   void emitTeamsCall(CodeGenFunction &CGF, const OMPExecutableDirective &D,
2467                      SourceLocation Loc, llvm::Function *OutlinedFn,
2468                      ArrayRef<llvm::Value *> CapturedVars) override;
2469 
2470   /// Emits call to void __kmpc_push_num_teams(ident_t *loc, kmp_int32
2471   /// global_tid, kmp_int32 num_teams, kmp_int32 thread_limit) to generate code
2472   /// for num_teams clause.
2473   /// \param NumTeams An integer expression of teams.
2474   /// \param ThreadLimit An integer expression of threads.
2475   void emitNumTeamsClause(CodeGenFunction &CGF, const Expr *NumTeams,
2476                           const Expr *ThreadLimit, SourceLocation Loc) override;
2477 
2478   /// Emit the target data mapping code associated with \a D.
2479   /// \param D Directive to emit.
2480   /// \param IfCond Expression evaluated in if clause associated with the
2481   /// target directive, or null if no if clause is used.
2482   /// \param Device Expression evaluated in device clause associated with the
2483   /// target directive, or null if no device clause is used.
2484   /// \param Info A record used to store information that needs to be preserved
2485   /// until the region is closed.
2486   void emitTargetDataCalls(CodeGenFunction &CGF,
2487                            const OMPExecutableDirective &D, const Expr *IfCond,
2488                            const Expr *Device, const RegionCodeGenTy &CodeGen,
2489                            TargetDataInfo &Info) override;
2490 
2491   /// Emit the data mapping/movement code associated with the directive
2492   /// \a D, which should be of the form 'target [{enter|exit} data | update]'.
2493   /// \param D Directive to emit.
2494   /// \param IfCond Expression evaluated in if clause associated with the target
2495   /// directive, or null if no if clause is used.
2496   /// \param Device Expression evaluated in device clause associated with the
2497   /// target directive, or null if no device clause is used.
2498   void emitTargetDataStandAloneCall(CodeGenFunction &CGF,
2499                                     const OMPExecutableDirective &D,
2500                                     const Expr *IfCond,
2501                                     const Expr *Device) override;
2502 
2503   /// Emit initialization for doacross loop nesting support.
2504   /// \param D Loop-based construct used in the doacross nesting construct.
2505   void emitDoacrossInit(CodeGenFunction &CGF, const OMPLoopDirective &D,
2506                         ArrayRef<Expr *> NumIterations) override;
2507 
2508   /// Emit code for the doacross ordered directive with a 'depend' clause.
2509   /// \param C 'depend' clause with 'sink|source' dependency kind.
2510   void emitDoacrossOrdered(CodeGenFunction &CGF,
2511                            const OMPDependClause *C) override;
2512 
2513   /// Translates the native parameter of the outlined function if this is
2514   /// required for the target.
2515   /// \param FD Field decl from captured record for the parameter.
2516   /// \param NativeParam Parameter itself.
2517   const VarDecl *translateParameter(const FieldDecl *FD,
2518                                     const VarDecl *NativeParam) const override;
2519 
2520   /// Gets the address of the native argument based on the address of the
2521   /// target-specific parameter.
2522   /// \param NativeParam Parameter itself.
2523   /// \param TargetParam Corresponding target-specific parameter.
2524   Address getParameterAddress(CodeGenFunction &CGF, const VarDecl *NativeParam,
2525                               const VarDecl *TargetParam) const override;
2526 
2527   /// Gets the OpenMP-specific address of the local variable \a VD.
2528   Address getAddressOfLocalVariable(CodeGenFunction &CGF,
2529                                     const VarDecl *VD) override {
2530     return Address::invalid(); // Unconditional: CGF and VD are not consulted.
2531   }
2532 };
2533 
2534 } // namespace CodeGen
2535 } // namespace clang
2536 
2537 #endif
2538