xref: /freebsd/contrib/llvm-project/llvm/lib/IR/ConstantFold.cpp (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
1 //===- ConstantFold.cpp - LLVM constant folder ----------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements folding of constants for LLVM.  This implements the
10 // (internal) ConstantFold.h interface, which is used by the
11 // ConstantExpr::get* methods to automatically fold constants when possible.
12 //
13 // The current constant folding implementation is implemented in two pieces: the
14 // pieces that don't need DataLayout, and the pieces that do. This is to avoid
15 // a dependence in IR on Target.
16 //
17 //===----------------------------------------------------------------------===//
18 
19 #include "llvm/IR/ConstantFold.h"
20 #include "llvm/ADT/APSInt.h"
21 #include "llvm/ADT/SmallVector.h"
22 #include "llvm/IR/Constants.h"
23 #include "llvm/IR/DerivedTypes.h"
24 #include "llvm/IR/Function.h"
25 #include "llvm/IR/GetElementPtrTypeIterator.h"
26 #include "llvm/IR/GlobalAlias.h"
27 #include "llvm/IR/GlobalVariable.h"
28 #include "llvm/IR/Instructions.h"
29 #include "llvm/IR/Module.h"
30 #include "llvm/IR/Operator.h"
31 #include "llvm/IR/PatternMatch.h"
32 #include "llvm/Support/ErrorHandling.h"
33 using namespace llvm;
34 using namespace llvm::PatternMatch;
35 
36 //===----------------------------------------------------------------------===//
37 //                ConstantFold*Instruction Implementations
38 //===----------------------------------------------------------------------===//
39 
40 /// This function determines which opcode to use to fold two constant cast
41 /// expressions together. It uses CastInst::isEliminableCastPair to determine
42 /// the opcode. Consequently its just a wrapper around that function.
43 /// Determine if it is valid to fold a cast of a cast
44 static unsigned
foldConstantCastPair(unsigned opc,ConstantExpr * Op,Type * DstTy)45 foldConstantCastPair(
46   unsigned opc,          ///< opcode of the second cast constant expression
47   ConstantExpr *Op,      ///< the first cast constant expression
48   Type *DstTy            ///< destination type of the first cast
49 ) {
50   assert(Op && Op->isCast() && "Can't fold cast of cast without a cast!");
51   assert(DstTy && DstTy->isFirstClassType() && "Invalid cast destination type");
52   assert(CastInst::isCast(opc) && "Invalid cast opcode");
53 
54   // The types and opcodes for the two Cast constant expressions
55   Type *SrcTy = Op->getOperand(0)->getType();
56   Type *MidTy = Op->getType();
57   Instruction::CastOps firstOp = Instruction::CastOps(Op->getOpcode());
58   Instruction::CastOps secondOp = Instruction::CastOps(opc);
59 
60   // Assume that pointers are never more than 64 bits wide, and only use this
61   // for the middle type. Otherwise we could end up folding away illegal
62   // bitcasts between address spaces with different sizes.
63   IntegerType *FakeIntPtrTy = Type::getInt64Ty(DstTy->getContext());
64 
65   // Let CastInst::isEliminableCastPair do the heavy lifting.
66   return CastInst::isEliminableCastPair(firstOp, secondOp, SrcTy, MidTy, DstTy,
67                                         nullptr, FakeIntPtrTy, nullptr);
68 }
69 
FoldBitCast(Constant * V,Type * DestTy)70 static Constant *FoldBitCast(Constant *V, Type *DestTy) {
71   Type *SrcTy = V->getType();
72   if (SrcTy == DestTy)
73     return V; // no-op cast
74 
75   // Handle casts from one vector constant to another.  We know that the src
76   // and dest type have the same size (otherwise its an illegal cast).
77   if (VectorType *DestPTy = dyn_cast<VectorType>(DestTy)) {
78     if (V->isAllOnesValue())
79       return Constant::getAllOnesValue(DestTy);
80 
81     // Canonicalize scalar-to-vector bitcasts into vector-to-vector bitcasts
82     // This allows for other simplifications (although some of them
83     // can only be handled by Analysis/ConstantFolding.cpp).
84     if (isa<ConstantInt>(V) || isa<ConstantFP>(V))
85       return ConstantExpr::getBitCast(ConstantVector::get(V), DestPTy);
86     return nullptr;
87   }
88 
89   // Handle integral constant input.
90   if (ConstantInt *CI = dyn_cast<ConstantInt>(V)) {
91     // See note below regarding the PPC_FP128 restriction.
92     if (DestTy->isFloatingPointTy() && !DestTy->isPPC_FP128Ty())
93       return ConstantFP::get(DestTy->getContext(),
94                              APFloat(DestTy->getFltSemantics(),
95                                      CI->getValue()));
96 
97     // Otherwise, can't fold this (vector?)
98     return nullptr;
99   }
100 
101   // Handle ConstantFP input: FP -> Integral.
102   if (ConstantFP *FP = dyn_cast<ConstantFP>(V)) {
103     // PPC_FP128 is really the sum of two consecutive doubles, where the first
104     // double is always stored first in memory, regardless of the target
105     // endianness. The memory layout of i128, however, depends on the target
106     // endianness, and so we can't fold this without target endianness
107     // information. This should instead be handled by
108     // Analysis/ConstantFolding.cpp
109     if (FP->getType()->isPPC_FP128Ty())
110       return nullptr;
111 
112     // Make sure dest type is compatible with the folded integer constant.
113     if (!DestTy->isIntegerTy())
114       return nullptr;
115 
116     return ConstantInt::get(FP->getContext(),
117                             FP->getValueAPF().bitcastToAPInt());
118   }
119 
120   return nullptr;
121 }
122 
foldMaybeUndesirableCast(unsigned opc,Constant * V,Type * DestTy)123 static Constant *foldMaybeUndesirableCast(unsigned opc, Constant *V,
124                                           Type *DestTy) {
125   return ConstantExpr::isDesirableCastOp(opc)
126              ? ConstantExpr::getCast(opc, V, DestTy)
127              : ConstantFoldCastInstruction(opc, V, DestTy);
128 }
129 
ConstantFoldCastInstruction(unsigned opc,Constant * V,Type * DestTy)130 Constant *llvm::ConstantFoldCastInstruction(unsigned opc, Constant *V,
131                                             Type *DestTy) {
132   if (isa<PoisonValue>(V))
133     return PoisonValue::get(DestTy);
134 
135   if (isa<UndefValue>(V)) {
136     // zext(undef) = 0, because the top bits will be zero.
137     // sext(undef) = 0, because the top bits will all be the same.
138     // [us]itofp(undef) = 0, because the result value is bounded.
139     if (opc == Instruction::ZExt || opc == Instruction::SExt ||
140         opc == Instruction::UIToFP || opc == Instruction::SIToFP)
141       return Constant::getNullValue(DestTy);
142     return UndefValue::get(DestTy);
143   }
144 
145   if (V->isNullValue() && !DestTy->isX86_MMXTy() && !DestTy->isX86_AMXTy() &&
146       opc != Instruction::AddrSpaceCast)
147     return Constant::getNullValue(DestTy);
148 
149   // If the cast operand is a constant expression, there's a few things we can
150   // do to try to simplify it.
151   if (ConstantExpr *CE = dyn_cast<ConstantExpr>(V)) {
152     if (CE->isCast()) {
153       // Try hard to fold cast of cast because they are often eliminable.
154       if (unsigned newOpc = foldConstantCastPair(opc, CE, DestTy))
155         return foldMaybeUndesirableCast(newOpc, CE->getOperand(0), DestTy);
156     }
157   }
158 
159   // If the cast operand is a constant vector, perform the cast by
160   // operating on each element. In the cast of bitcasts, the element
161   // count may be mismatched; don't attempt to handle that here.
162   if ((isa<ConstantVector>(V) || isa<ConstantDataVector>(V)) &&
163       DestTy->isVectorTy() &&
164       cast<FixedVectorType>(DestTy)->getNumElements() ==
165           cast<FixedVectorType>(V->getType())->getNumElements()) {
166     VectorType *DestVecTy = cast<VectorType>(DestTy);
167     Type *DstEltTy = DestVecTy->getElementType();
168     // Fast path for splatted constants.
169     if (Constant *Splat = V->getSplatValue()) {
170       Constant *Res = foldMaybeUndesirableCast(opc, Splat, DstEltTy);
171       if (!Res)
172         return nullptr;
173       return ConstantVector::getSplat(
174           cast<VectorType>(DestTy)->getElementCount(), Res);
175     }
176     SmallVector<Constant *, 16> res;
177     Type *Ty = IntegerType::get(V->getContext(), 32);
178     for (unsigned i = 0,
179                   e = cast<FixedVectorType>(V->getType())->getNumElements();
180          i != e; ++i) {
181       Constant *C = ConstantExpr::getExtractElement(V, ConstantInt::get(Ty, i));
182       Constant *Casted = foldMaybeUndesirableCast(opc, C, DstEltTy);
183       if (!Casted)
184         return nullptr;
185       res.push_back(Casted);
186     }
187     return ConstantVector::get(res);
188   }
189 
190   // We actually have to do a cast now. Perform the cast according to the
191   // opcode specified.
192   switch (opc) {
193   default:
194     llvm_unreachable("Failed to cast constant expression");
195   case Instruction::FPTrunc:
196   case Instruction::FPExt:
197     if (ConstantFP *FPC = dyn_cast<ConstantFP>(V)) {
198       bool ignored;
199       APFloat Val = FPC->getValueAPF();
200       Val.convert(DestTy->getFltSemantics(), APFloat::rmNearestTiesToEven,
201                   &ignored);
202       return ConstantFP::get(V->getContext(), Val);
203     }
204     return nullptr; // Can't fold.
205   case Instruction::FPToUI:
206   case Instruction::FPToSI:
207     if (ConstantFP *FPC = dyn_cast<ConstantFP>(V)) {
208       const APFloat &V = FPC->getValueAPF();
209       bool ignored;
210       uint32_t DestBitWidth = cast<IntegerType>(DestTy)->getBitWidth();
211       APSInt IntVal(DestBitWidth, opc == Instruction::FPToUI);
212       if (APFloat::opInvalidOp ==
213           V.convertToInteger(IntVal, APFloat::rmTowardZero, &ignored)) {
214         // Undefined behavior invoked - the destination type can't represent
215         // the input constant.
216         return PoisonValue::get(DestTy);
217       }
218       return ConstantInt::get(FPC->getContext(), IntVal);
219     }
220     return nullptr; // Can't fold.
221   case Instruction::UIToFP:
222   case Instruction::SIToFP:
223     if (ConstantInt *CI = dyn_cast<ConstantInt>(V)) {
224       const APInt &api = CI->getValue();
225       APFloat apf(DestTy->getFltSemantics(),
226                   APInt::getZero(DestTy->getPrimitiveSizeInBits()));
227       apf.convertFromAPInt(api, opc==Instruction::SIToFP,
228                            APFloat::rmNearestTiesToEven);
229       return ConstantFP::get(V->getContext(), apf);
230     }
231     return nullptr;
232   case Instruction::ZExt:
233     if (ConstantInt *CI = dyn_cast<ConstantInt>(V)) {
234       uint32_t BitWidth = cast<IntegerType>(DestTy)->getBitWidth();
235       return ConstantInt::get(V->getContext(),
236                               CI->getValue().zext(BitWidth));
237     }
238     return nullptr;
239   case Instruction::SExt:
240     if (ConstantInt *CI = dyn_cast<ConstantInt>(V)) {
241       uint32_t BitWidth = cast<IntegerType>(DestTy)->getBitWidth();
242       return ConstantInt::get(V->getContext(),
243                               CI->getValue().sext(BitWidth));
244     }
245     return nullptr;
246   case Instruction::Trunc: {
247     if (V->getType()->isVectorTy())
248       return nullptr;
249 
250     uint32_t DestBitWidth = cast<IntegerType>(DestTy)->getBitWidth();
251     if (ConstantInt *CI = dyn_cast<ConstantInt>(V)) {
252       return ConstantInt::get(V->getContext(),
253                               CI->getValue().trunc(DestBitWidth));
254     }
255 
256     return nullptr;
257   }
258   case Instruction::BitCast:
259     return FoldBitCast(V, DestTy);
260   case Instruction::AddrSpaceCast:
261   case Instruction::IntToPtr:
262   case Instruction::PtrToInt:
263     return nullptr;
264   }
265 }
266 
ConstantFoldSelectInstruction(Constant * Cond,Constant * V1,Constant * V2)267 Constant *llvm::ConstantFoldSelectInstruction(Constant *Cond,
268                                               Constant *V1, Constant *V2) {
269   // Check for i1 and vector true/false conditions.
270   if (Cond->isNullValue()) return V2;
271   if (Cond->isAllOnesValue()) return V1;
272 
273   // If the condition is a vector constant, fold the result elementwise.
274   if (ConstantVector *CondV = dyn_cast<ConstantVector>(Cond)) {
275     auto *V1VTy = CondV->getType();
276     SmallVector<Constant*, 16> Result;
277     Type *Ty = IntegerType::get(CondV->getContext(), 32);
278     for (unsigned i = 0, e = V1VTy->getNumElements(); i != e; ++i) {
279       Constant *V;
280       Constant *V1Element = ConstantExpr::getExtractElement(V1,
281                                                     ConstantInt::get(Ty, i));
282       Constant *V2Element = ConstantExpr::getExtractElement(V2,
283                                                     ConstantInt::get(Ty, i));
284       auto *Cond = cast<Constant>(CondV->getOperand(i));
285       if (isa<PoisonValue>(Cond)) {
286         V = PoisonValue::get(V1Element->getType());
287       } else if (V1Element == V2Element) {
288         V = V1Element;
289       } else if (isa<UndefValue>(Cond)) {
290         V = isa<UndefValue>(V1Element) ? V1Element : V2Element;
291       } else {
292         if (!isa<ConstantInt>(Cond)) break;
293         V = Cond->isNullValue() ? V2Element : V1Element;
294       }
295       Result.push_back(V);
296     }
297 
298     // If we were able to build the vector, return it.
299     if (Result.size() == V1VTy->getNumElements())
300       return ConstantVector::get(Result);
301   }
302 
303   if (isa<PoisonValue>(Cond))
304     return PoisonValue::get(V1->getType());
305 
306   if (isa<UndefValue>(Cond)) {
307     if (isa<UndefValue>(V1)) return V1;
308     return V2;
309   }
310 
311   if (V1 == V2) return V1;
312 
313   if (isa<PoisonValue>(V1))
314     return V2;
315   if (isa<PoisonValue>(V2))
316     return V1;
317 
318   // If the true or false value is undef, we can fold to the other value as
319   // long as the other value isn't poison.
320   auto NotPoison = [](Constant *C) {
321     if (isa<PoisonValue>(C))
322       return false;
323 
324     // TODO: We can analyze ConstExpr by opcode to determine if there is any
325     //       possibility of poison.
326     if (isa<ConstantExpr>(C))
327       return false;
328 
329     if (isa<ConstantInt>(C) || isa<GlobalVariable>(C) || isa<ConstantFP>(C) ||
330         isa<ConstantPointerNull>(C) || isa<Function>(C))
331       return true;
332 
333     if (C->getType()->isVectorTy())
334       return !C->containsPoisonElement() && !C->containsConstantExpression();
335 
336     // TODO: Recursively analyze aggregates or other constants.
337     return false;
338   };
339   if (isa<UndefValue>(V1) && NotPoison(V2)) return V2;
340   if (isa<UndefValue>(V2) && NotPoison(V1)) return V1;
341 
342   return nullptr;
343 }
344 
ConstantFoldExtractElementInstruction(Constant * Val,Constant * Idx)345 Constant *llvm::ConstantFoldExtractElementInstruction(Constant *Val,
346                                                       Constant *Idx) {
347   auto *ValVTy = cast<VectorType>(Val->getType());
348 
349   // extractelt poison, C -> poison
350   // extractelt C, undef -> poison
351   if (isa<PoisonValue>(Val) || isa<UndefValue>(Idx))
352     return PoisonValue::get(ValVTy->getElementType());
353 
354   // extractelt undef, C -> undef
355   if (isa<UndefValue>(Val))
356     return UndefValue::get(ValVTy->getElementType());
357 
358   auto *CIdx = dyn_cast<ConstantInt>(Idx);
359   if (!CIdx)
360     return nullptr;
361 
362   if (auto *ValFVTy = dyn_cast<FixedVectorType>(Val->getType())) {
363     // ee({w,x,y,z}, wrong_value) -> poison
364     if (CIdx->uge(ValFVTy->getNumElements()))
365       return PoisonValue::get(ValFVTy->getElementType());
366   }
367 
368   // ee (gep (ptr, idx0, ...), idx) -> gep (ee (ptr, idx), ee (idx0, idx), ...)
369   if (auto *CE = dyn_cast<ConstantExpr>(Val)) {
370     if (auto *GEP = dyn_cast<GEPOperator>(CE)) {
371       SmallVector<Constant *, 8> Ops;
372       Ops.reserve(CE->getNumOperands());
373       for (unsigned i = 0, e = CE->getNumOperands(); i != e; ++i) {
374         Constant *Op = CE->getOperand(i);
375         if (Op->getType()->isVectorTy()) {
376           Constant *ScalarOp = ConstantExpr::getExtractElement(Op, Idx);
377           if (!ScalarOp)
378             return nullptr;
379           Ops.push_back(ScalarOp);
380         } else
381           Ops.push_back(Op);
382       }
383       return CE->getWithOperands(Ops, ValVTy->getElementType(), false,
384                                  GEP->getSourceElementType());
385     } else if (CE->getOpcode() == Instruction::InsertElement) {
386       if (const auto *IEIdx = dyn_cast<ConstantInt>(CE->getOperand(2))) {
387         if (APSInt::isSameValue(APSInt(IEIdx->getValue()),
388                                 APSInt(CIdx->getValue()))) {
389           return CE->getOperand(1);
390         } else {
391           return ConstantExpr::getExtractElement(CE->getOperand(0), CIdx);
392         }
393       }
394     }
395   }
396 
397   if (Constant *C = Val->getAggregateElement(CIdx))
398     return C;
399 
400   // Lane < Splat minimum vector width => extractelt Splat(x), Lane -> x
401   if (CIdx->getValue().ult(ValVTy->getElementCount().getKnownMinValue())) {
402     if (Constant *SplatVal = Val->getSplatValue())
403       return SplatVal;
404   }
405 
406   return nullptr;
407 }
408 
ConstantFoldInsertElementInstruction(Constant * Val,Constant * Elt,Constant * Idx)409 Constant *llvm::ConstantFoldInsertElementInstruction(Constant *Val,
410                                                      Constant *Elt,
411                                                      Constant *Idx) {
412   if (isa<UndefValue>(Idx))
413     return PoisonValue::get(Val->getType());
414 
415   // Inserting null into all zeros is still all zeros.
416   // TODO: This is true for undef and poison splats too.
417   if (isa<ConstantAggregateZero>(Val) && Elt->isNullValue())
418     return Val;
419 
420   ConstantInt *CIdx = dyn_cast<ConstantInt>(Idx);
421   if (!CIdx) return nullptr;
422 
423   // Do not iterate on scalable vector. The num of elements is unknown at
424   // compile-time.
425   if (isa<ScalableVectorType>(Val->getType()))
426     return nullptr;
427 
428   auto *ValTy = cast<FixedVectorType>(Val->getType());
429 
430   unsigned NumElts = ValTy->getNumElements();
431   if (CIdx->uge(NumElts))
432     return PoisonValue::get(Val->getType());
433 
434   SmallVector<Constant*, 16> Result;
435   Result.reserve(NumElts);
436   auto *Ty = Type::getInt32Ty(Val->getContext());
437   uint64_t IdxVal = CIdx->getZExtValue();
438   for (unsigned i = 0; i != NumElts; ++i) {
439     if (i == IdxVal) {
440       Result.push_back(Elt);
441       continue;
442     }
443 
444     Constant *C = ConstantExpr::getExtractElement(Val, ConstantInt::get(Ty, i));
445     Result.push_back(C);
446   }
447 
448   return ConstantVector::get(Result);
449 }
450 
ConstantFoldShuffleVectorInstruction(Constant * V1,Constant * V2,ArrayRef<int> Mask)451 Constant *llvm::ConstantFoldShuffleVectorInstruction(Constant *V1, Constant *V2,
452                                                      ArrayRef<int> Mask) {
453   auto *V1VTy = cast<VectorType>(V1->getType());
454   unsigned MaskNumElts = Mask.size();
455   auto MaskEltCount =
456       ElementCount::get(MaskNumElts, isa<ScalableVectorType>(V1VTy));
457   Type *EltTy = V1VTy->getElementType();
458 
459   // Poison shuffle mask -> poison value.
460   if (all_of(Mask, [](int Elt) { return Elt == PoisonMaskElem; })) {
461     return PoisonValue::get(VectorType::get(EltTy, MaskEltCount));
462   }
463 
464   // If the mask is all zeros this is a splat, no need to go through all
465   // elements.
466   if (all_of(Mask, [](int Elt) { return Elt == 0; })) {
467     Type *Ty = IntegerType::get(V1->getContext(), 32);
468     Constant *Elt =
469         ConstantExpr::getExtractElement(V1, ConstantInt::get(Ty, 0));
470 
471     if (Elt->isNullValue()) {
472       auto *VTy = VectorType::get(EltTy, MaskEltCount);
473       return ConstantAggregateZero::get(VTy);
474     } else if (!MaskEltCount.isScalable())
475       return ConstantVector::getSplat(MaskEltCount, Elt);
476   }
477 
478   // Do not iterate on scalable vector. The num of elements is unknown at
479   // compile-time.
480   if (isa<ScalableVectorType>(V1VTy))
481     return nullptr;
482 
483   unsigned SrcNumElts = V1VTy->getElementCount().getKnownMinValue();
484 
485   // Loop over the shuffle mask, evaluating each element.
486   SmallVector<Constant*, 32> Result;
487   for (unsigned i = 0; i != MaskNumElts; ++i) {
488     int Elt = Mask[i];
489     if (Elt == -1) {
490       Result.push_back(UndefValue::get(EltTy));
491       continue;
492     }
493     Constant *InElt;
494     if (unsigned(Elt) >= SrcNumElts*2)
495       InElt = UndefValue::get(EltTy);
496     else if (unsigned(Elt) >= SrcNumElts) {
497       Type *Ty = IntegerType::get(V2->getContext(), 32);
498       InElt =
499         ConstantExpr::getExtractElement(V2,
500                                         ConstantInt::get(Ty, Elt - SrcNumElts));
501     } else {
502       Type *Ty = IntegerType::get(V1->getContext(), 32);
503       InElt = ConstantExpr::getExtractElement(V1, ConstantInt::get(Ty, Elt));
504     }
505     Result.push_back(InElt);
506   }
507 
508   return ConstantVector::get(Result);
509 }
510 
ConstantFoldExtractValueInstruction(Constant * Agg,ArrayRef<unsigned> Idxs)511 Constant *llvm::ConstantFoldExtractValueInstruction(Constant *Agg,
512                                                     ArrayRef<unsigned> Idxs) {
513   // Base case: no indices, so return the entire value.
514   if (Idxs.empty())
515     return Agg;
516 
517   if (Constant *C = Agg->getAggregateElement(Idxs[0]))
518     return ConstantFoldExtractValueInstruction(C, Idxs.slice(1));
519 
520   return nullptr;
521 }
522 
ConstantFoldInsertValueInstruction(Constant * Agg,Constant * Val,ArrayRef<unsigned> Idxs)523 Constant *llvm::ConstantFoldInsertValueInstruction(Constant *Agg,
524                                                    Constant *Val,
525                                                    ArrayRef<unsigned> Idxs) {
526   // Base case: no indices, so replace the entire value.
527   if (Idxs.empty())
528     return Val;
529 
530   unsigned NumElts;
531   if (StructType *ST = dyn_cast<StructType>(Agg->getType()))
532     NumElts = ST->getNumElements();
533   else
534     NumElts = cast<ArrayType>(Agg->getType())->getNumElements();
535 
536   SmallVector<Constant*, 32> Result;
537   for (unsigned i = 0; i != NumElts; ++i) {
538     Constant *C = Agg->getAggregateElement(i);
539     if (!C) return nullptr;
540 
541     if (Idxs[0] == i)
542       C = ConstantFoldInsertValueInstruction(C, Val, Idxs.slice(1));
543 
544     Result.push_back(C);
545   }
546 
547   if (StructType *ST = dyn_cast<StructType>(Agg->getType()))
548     return ConstantStruct::get(ST, Result);
549   return ConstantArray::get(cast<ArrayType>(Agg->getType()), Result);
550 }
551 
ConstantFoldUnaryInstruction(unsigned Opcode,Constant * C)552 Constant *llvm::ConstantFoldUnaryInstruction(unsigned Opcode, Constant *C) {
553   assert(Instruction::isUnaryOp(Opcode) && "Non-unary instruction detected");
554 
555   // Handle scalar UndefValue and scalable vector UndefValue. Fixed-length
556   // vectors are always evaluated per element.
557   bool IsScalableVector = isa<ScalableVectorType>(C->getType());
558   bool HasScalarUndefOrScalableVectorUndef =
559       (!C->getType()->isVectorTy() || IsScalableVector) && isa<UndefValue>(C);
560 
561   if (HasScalarUndefOrScalableVectorUndef) {
562     switch (static_cast<Instruction::UnaryOps>(Opcode)) {
563     case Instruction::FNeg:
564       return C; // -undef -> undef
565     case Instruction::UnaryOpsEnd:
566       llvm_unreachable("Invalid UnaryOp");
567     }
568   }
569 
570   // Constant should not be UndefValue, unless these are vector constants.
571   assert(!HasScalarUndefOrScalableVectorUndef && "Unexpected UndefValue");
572   // We only have FP UnaryOps right now.
573   assert(!isa<ConstantInt>(C) && "Unexpected Integer UnaryOp");
574 
575   if (ConstantFP *CFP = dyn_cast<ConstantFP>(C)) {
576     const APFloat &CV = CFP->getValueAPF();
577     switch (Opcode) {
578     default:
579       break;
580     case Instruction::FNeg:
581       return ConstantFP::get(C->getContext(), neg(CV));
582     }
583   } else if (auto *VTy = dyn_cast<FixedVectorType>(C->getType())) {
584 
585     Type *Ty = IntegerType::get(VTy->getContext(), 32);
586     // Fast path for splatted constants.
587     if (Constant *Splat = C->getSplatValue())
588       if (Constant *Elt = ConstantFoldUnaryInstruction(Opcode, Splat))
589         return ConstantVector::getSplat(VTy->getElementCount(), Elt);
590 
591     // Fold each element and create a vector constant from those constants.
592     SmallVector<Constant *, 16> Result;
593     for (unsigned i = 0, e = VTy->getNumElements(); i != e; ++i) {
594       Constant *ExtractIdx = ConstantInt::get(Ty, i);
595       Constant *Elt = ConstantExpr::getExtractElement(C, ExtractIdx);
596       Constant *Res = ConstantFoldUnaryInstruction(Opcode, Elt);
597       if (!Res)
598         return nullptr;
599       Result.push_back(Res);
600     }
601 
602     return ConstantVector::get(Result);
603   }
604 
605   // We don't know how to fold this.
606   return nullptr;
607 }
608 
ConstantFoldBinaryInstruction(unsigned Opcode,Constant * C1,Constant * C2)609 Constant *llvm::ConstantFoldBinaryInstruction(unsigned Opcode, Constant *C1,
610                                               Constant *C2) {
611   assert(Instruction::isBinaryOp(Opcode) && "Non-binary instruction detected");
612 
613   // Simplify BinOps with their identity values first. They are no-ops and we
614   // can always return the other value, including undef or poison values.
615   if (Constant *Identity = ConstantExpr::getBinOpIdentity(
616           Opcode, C1->getType(), /*AllowRHSIdentity*/ false)) {
617     if (C1 == Identity)
618       return C2;
619     if (C2 == Identity)
620       return C1;
621   } else if (Constant *Identity = ConstantExpr::getBinOpIdentity(
622                  Opcode, C1->getType(), /*AllowRHSIdentity*/ true)) {
623     if (C2 == Identity)
624       return C1;
625   }
626 
627   // Binary operations propagate poison.
628   if (isa<PoisonValue>(C1) || isa<PoisonValue>(C2))
629     return PoisonValue::get(C1->getType());
630 
631   // Handle scalar UndefValue and scalable vector UndefValue. Fixed-length
632   // vectors are always evaluated per element.
633   bool IsScalableVector = isa<ScalableVectorType>(C1->getType());
634   bool HasScalarUndefOrScalableVectorUndef =
635       (!C1->getType()->isVectorTy() || IsScalableVector) &&
636       (isa<UndefValue>(C1) || isa<UndefValue>(C2));
637   if (HasScalarUndefOrScalableVectorUndef) {
638     switch (static_cast<Instruction::BinaryOps>(Opcode)) {
639     case Instruction::Xor:
640       if (isa<UndefValue>(C1) && isa<UndefValue>(C2))
641         // Handle undef ^ undef -> 0 special case. This is a common
642         // idiom (misuse).
643         return Constant::getNullValue(C1->getType());
644       [[fallthrough]];
645     case Instruction::Add:
646     case Instruction::Sub:
647       return UndefValue::get(C1->getType());
648     case Instruction::And:
649       if (isa<UndefValue>(C1) && isa<UndefValue>(C2)) // undef & undef -> undef
650         return C1;
651       return Constant::getNullValue(C1->getType());   // undef & X -> 0
652     case Instruction::Mul: {
653       // undef * undef -> undef
654       if (isa<UndefValue>(C1) && isa<UndefValue>(C2))
655         return C1;
656       const APInt *CV;
657       // X * undef -> undef   if X is odd
658       if (match(C1, m_APInt(CV)) || match(C2, m_APInt(CV)))
659         if ((*CV)[0])
660           return UndefValue::get(C1->getType());
661 
662       // X * undef -> 0       otherwise
663       return Constant::getNullValue(C1->getType());
664     }
665     case Instruction::SDiv:
666     case Instruction::UDiv:
667       // X / undef -> poison
668       // X / 0 -> poison
669       if (match(C2, m_CombineOr(m_Undef(), m_Zero())))
670         return PoisonValue::get(C2->getType());
671       // undef / X -> 0       otherwise
672       return Constant::getNullValue(C1->getType());
673     case Instruction::URem:
674     case Instruction::SRem:
675       // X % undef -> poison
676       // X % 0 -> poison
677       if (match(C2, m_CombineOr(m_Undef(), m_Zero())))
678         return PoisonValue::get(C2->getType());
679       // undef % X -> 0       otherwise
680       return Constant::getNullValue(C1->getType());
681     case Instruction::Or:                          // X | undef -> -1
682       if (isa<UndefValue>(C1) && isa<UndefValue>(C2)) // undef | undef -> undef
683         return C1;
684       return Constant::getAllOnesValue(C1->getType()); // undef | X -> ~0
685     case Instruction::LShr:
686       // X >>l undef -> poison
687       if (isa<UndefValue>(C2))
688         return PoisonValue::get(C2->getType());
689       // undef >>l X -> 0
690       return Constant::getNullValue(C1->getType());
691     case Instruction::AShr:
692       // X >>a undef -> poison
693       if (isa<UndefValue>(C2))
694         return PoisonValue::get(C2->getType());
695       // TODO: undef >>a X -> poison if the shift is exact
696       // undef >>a X -> 0
697       return Constant::getNullValue(C1->getType());
698     case Instruction::Shl:
699       // X << undef -> undef
700       if (isa<UndefValue>(C2))
701         return PoisonValue::get(C2->getType());
702       // undef << X -> 0
703       return Constant::getNullValue(C1->getType());
704     case Instruction::FSub:
705       // -0.0 - undef --> undef (consistent with "fneg undef")
706       if (match(C1, m_NegZeroFP()) && isa<UndefValue>(C2))
707         return C2;
708       [[fallthrough]];
709     case Instruction::FAdd:
710     case Instruction::FMul:
711     case Instruction::FDiv:
712     case Instruction::FRem:
713       // [any flop] undef, undef -> undef
714       if (isa<UndefValue>(C1) && isa<UndefValue>(C2))
715         return C1;
716       // [any flop] C, undef -> NaN
717       // [any flop] undef, C -> NaN
718       // We could potentially specialize NaN/Inf constants vs. 'normal'
719       // constants (possibly differently depending on opcode and operand). This
720       // would allow returning undef sometimes. But it is always safe to fold to
721       // NaN because we can choose the undef operand as NaN, and any FP opcode
722       // with a NaN operand will propagate NaN.
723       return ConstantFP::getNaN(C1->getType());
724     case Instruction::BinaryOpsEnd:
725       llvm_unreachable("Invalid BinaryOp");
726     }
727   }
728 
729   // Neither constant should be UndefValue, unless these are vector constants.
730   assert((!HasScalarUndefOrScalableVectorUndef) && "Unexpected UndefValue");
731 
732   // Handle simplifications when the RHS is a constant int.
733   if (ConstantInt *CI2 = dyn_cast<ConstantInt>(C2)) {
734     switch (Opcode) {
735     case Instruction::Mul:
736       if (CI2->isZero())
737         return C2; // X * 0 == 0
738       break;
739     case Instruction::UDiv:
740     case Instruction::SDiv:
741       if (CI2->isZero())
742         return PoisonValue::get(CI2->getType());              // X / 0 == poison
743       break;
744     case Instruction::URem:
745     case Instruction::SRem:
746       if (CI2->isOne())
747         return Constant::getNullValue(CI2->getType());        // X % 1 == 0
748       if (CI2->isZero())
749         return PoisonValue::get(CI2->getType());              // X % 0 == poison
750       break;
751     case Instruction::And:
752       if (CI2->isZero())
753         return C2; // X & 0 == 0
754 
755       if (ConstantExpr *CE1 = dyn_cast<ConstantExpr>(C1)) {
756         // If and'ing the address of a global with a constant, fold it.
757         if (CE1->getOpcode() == Instruction::PtrToInt &&
758             isa<GlobalValue>(CE1->getOperand(0))) {
759           GlobalValue *GV = cast<GlobalValue>(CE1->getOperand(0));
760 
761           Align GVAlign; // defaults to 1
762 
763           if (Module *TheModule = GV->getParent()) {
764             const DataLayout &DL = TheModule->getDataLayout();
765             GVAlign = GV->getPointerAlignment(DL);
766 
767             // If the function alignment is not specified then assume that it
768             // is 4.
769             // This is dangerous; on x86, the alignment of the pointer
770             // corresponds to the alignment of the function, but might be less
771             // than 4 if it isn't explicitly specified.
772             // However, a fix for this behaviour was reverted because it
773             // increased code size (see https://reviews.llvm.org/D55115)
774             // FIXME: This code should be deleted once existing targets have
775             // appropriate defaults
776             if (isa<Function>(GV) && !DL.getFunctionPtrAlign())
777               GVAlign = Align(4);
778           } else if (isa<GlobalVariable>(GV)) {
779             GVAlign = cast<GlobalVariable>(GV)->getAlign().valueOrOne();
780           }
781 
782           if (GVAlign > 1) {
783             unsigned DstWidth = CI2->getBitWidth();
784             unsigned SrcWidth = std::min(DstWidth, Log2(GVAlign));
785             APInt BitsNotSet(APInt::getLowBitsSet(DstWidth, SrcWidth));
786 
787             // If checking bits we know are clear, return zero.
788             if ((CI2->getValue() & BitsNotSet) == CI2->getValue())
789               return Constant::getNullValue(CI2->getType());
790           }
791         }
792       }
793       break;
794     case Instruction::Or:
795       if (CI2->isMinusOne())
796         return C2; // X | -1 == -1
797       break;
798     }
799   } else if (isa<ConstantInt>(C1)) {
800     // If C1 is a ConstantInt and C2 is not, swap the operands.
801     if (Instruction::isCommutative(Opcode))
802       return ConstantExpr::isDesirableBinOp(Opcode)
803                  ? ConstantExpr::get(Opcode, C2, C1)
804                  : ConstantFoldBinaryInstruction(Opcode, C2, C1);
805   }
806 
807   if (ConstantInt *CI1 = dyn_cast<ConstantInt>(C1)) {
808     if (ConstantInt *CI2 = dyn_cast<ConstantInt>(C2)) {
809       const APInt &C1V = CI1->getValue();
810       const APInt &C2V = CI2->getValue();
811       switch (Opcode) {
812       default:
813         break;
814       case Instruction::Add:
815         return ConstantInt::get(CI1->getContext(), C1V + C2V);
816       case Instruction::Sub:
817         return ConstantInt::get(CI1->getContext(), C1V - C2V);
818       case Instruction::Mul:
819         return ConstantInt::get(CI1->getContext(), C1V * C2V);
820       case Instruction::UDiv:
821         assert(!CI2->isZero() && "Div by zero handled above");
822         return ConstantInt::get(CI1->getContext(), C1V.udiv(C2V));
823       case Instruction::SDiv:
824         assert(!CI2->isZero() && "Div by zero handled above");
825         if (C2V.isAllOnes() && C1V.isMinSignedValue())
826           return PoisonValue::get(CI1->getType());   // MIN_INT / -1 -> poison
827         return ConstantInt::get(CI1->getContext(), C1V.sdiv(C2V));
828       case Instruction::URem:
829         assert(!CI2->isZero() && "Div by zero handled above");
830         return ConstantInt::get(CI1->getContext(), C1V.urem(C2V));
831       case Instruction::SRem:
832         assert(!CI2->isZero() && "Div by zero handled above");
833         if (C2V.isAllOnes() && C1V.isMinSignedValue())
834           return PoisonValue::get(CI1->getType());   // MIN_INT % -1 -> poison
835         return ConstantInt::get(CI1->getContext(), C1V.srem(C2V));
836       case Instruction::And:
837         return ConstantInt::get(CI1->getContext(), C1V & C2V);
838       case Instruction::Or:
839         return ConstantInt::get(CI1->getContext(), C1V | C2V);
840       case Instruction::Xor:
841         return ConstantInt::get(CI1->getContext(), C1V ^ C2V);
842       case Instruction::Shl:
843         if (C2V.ult(C1V.getBitWidth()))
844           return ConstantInt::get(CI1->getContext(), C1V.shl(C2V));
845         return PoisonValue::get(C1->getType()); // too big shift is poison
846       case Instruction::LShr:
847         if (C2V.ult(C1V.getBitWidth()))
848           return ConstantInt::get(CI1->getContext(), C1V.lshr(C2V));
849         return PoisonValue::get(C1->getType()); // too big shift is poison
850       case Instruction::AShr:
851         if (C2V.ult(C1V.getBitWidth()))
852           return ConstantInt::get(CI1->getContext(), C1V.ashr(C2V));
853         return PoisonValue::get(C1->getType()); // too big shift is poison
854       }
855     }
856 
857     switch (Opcode) {
858     case Instruction::SDiv:
859     case Instruction::UDiv:
860     case Instruction::URem:
861     case Instruction::SRem:
862     case Instruction::LShr:
863     case Instruction::AShr:
864     case Instruction::Shl:
865       if (CI1->isZero()) return C1;
866       break;
867     default:
868       break;
869     }
870   } else if (ConstantFP *CFP1 = dyn_cast<ConstantFP>(C1)) {
871     if (ConstantFP *CFP2 = dyn_cast<ConstantFP>(C2)) {
872       const APFloat &C1V = CFP1->getValueAPF();
873       const APFloat &C2V = CFP2->getValueAPF();
874       APFloat C3V = C1V;  // copy for modification
875       switch (Opcode) {
876       default:
877         break;
878       case Instruction::FAdd:
879         (void)C3V.add(C2V, APFloat::rmNearestTiesToEven);
880         return ConstantFP::get(C1->getContext(), C3V);
881       case Instruction::FSub:
882         (void)C3V.subtract(C2V, APFloat::rmNearestTiesToEven);
883         return ConstantFP::get(C1->getContext(), C3V);
884       case Instruction::FMul:
885         (void)C3V.multiply(C2V, APFloat::rmNearestTiesToEven);
886         return ConstantFP::get(C1->getContext(), C3V);
887       case Instruction::FDiv:
888         (void)C3V.divide(C2V, APFloat::rmNearestTiesToEven);
889         return ConstantFP::get(C1->getContext(), C3V);
890       case Instruction::FRem:
891         (void)C3V.mod(C2V);
892         return ConstantFP::get(C1->getContext(), C3V);
893       }
894     }
895   } else if (auto *VTy = dyn_cast<VectorType>(C1->getType())) {
896     // Fast path for splatted constants.
897     if (Constant *C2Splat = C2->getSplatValue()) {
898       if (Instruction::isIntDivRem(Opcode) && C2Splat->isNullValue())
899         return PoisonValue::get(VTy);
900       if (Constant *C1Splat = C1->getSplatValue()) {
901         Constant *Res =
902             ConstantExpr::isDesirableBinOp(Opcode)
903                 ? ConstantExpr::get(Opcode, C1Splat, C2Splat)
904                 : ConstantFoldBinaryInstruction(Opcode, C1Splat, C2Splat);
905         if (!Res)
906           return nullptr;
907         return ConstantVector::getSplat(VTy->getElementCount(), Res);
908       }
909     }
910 
911     if (auto *FVTy = dyn_cast<FixedVectorType>(VTy)) {
912       // Fold each element and create a vector constant from those constants.
913       SmallVector<Constant*, 16> Result;
914       Type *Ty = IntegerType::get(FVTy->getContext(), 32);
915       for (unsigned i = 0, e = FVTy->getNumElements(); i != e; ++i) {
916         Constant *ExtractIdx = ConstantInt::get(Ty, i);
917         Constant *LHS = ConstantExpr::getExtractElement(C1, ExtractIdx);
918         Constant *RHS = ConstantExpr::getExtractElement(C2, ExtractIdx);
919 
920         // If any element of a divisor vector is zero, the whole op is poison.
921         if (Instruction::isIntDivRem(Opcode) && RHS->isNullValue())
922           return PoisonValue::get(VTy);
923 
924         Constant *Res = ConstantExpr::isDesirableBinOp(Opcode)
925                             ? ConstantExpr::get(Opcode, LHS, RHS)
926                             : ConstantFoldBinaryInstruction(Opcode, LHS, RHS);
927         if (!Res)
928           return nullptr;
929         Result.push_back(Res);
930       }
931 
932       return ConstantVector::get(Result);
933     }
934   }
935 
936   if (ConstantExpr *CE1 = dyn_cast<ConstantExpr>(C1)) {
937     // There are many possible foldings we could do here.  We should probably
938     // at least fold add of a pointer with an integer into the appropriate
939     // getelementptr.  This will improve alias analysis a bit.
940 
941     // Given ((a + b) + c), if (b + c) folds to something interesting, return
942     // (a + (b + c)).
943     if (Instruction::isAssociative(Opcode) && CE1->getOpcode() == Opcode) {
944       Constant *T = ConstantExpr::get(Opcode, CE1->getOperand(1), C2);
945       if (!isa<ConstantExpr>(T) || cast<ConstantExpr>(T)->getOpcode() != Opcode)
946         return ConstantExpr::get(Opcode, CE1->getOperand(0), T);
947     }
948   } else if (isa<ConstantExpr>(C2)) {
949     // If C2 is a constant expr and C1 isn't, flop them around and fold the
950     // other way if possible.
951     if (Instruction::isCommutative(Opcode))
952       return ConstantFoldBinaryInstruction(Opcode, C2, C1);
953   }
954 
955   // i1 can be simplified in many cases.
956   if (C1->getType()->isIntegerTy(1)) {
957     switch (Opcode) {
958     case Instruction::Add:
959     case Instruction::Sub:
960       return ConstantExpr::getXor(C1, C2);
961     case Instruction::Shl:
962     case Instruction::LShr:
963     case Instruction::AShr:
964       // We can assume that C2 == 0.  If it were one the result would be
965       // undefined because the shift value is as large as the bitwidth.
966       return C1;
967     case Instruction::SDiv:
968     case Instruction::UDiv:
969       // We can assume that C2 == 1.  If it were zero the result would be
970       // undefined through division by zero.
971       return C1;
972     case Instruction::URem:
973     case Instruction::SRem:
974       // We can assume that C2 == 1.  If it were zero the result would be
975       // undefined through division by zero.
976       return ConstantInt::getFalse(C1->getContext());
977     default:
978       break;
979     }
980   }
981 
982   // We don't know how to fold this.
983   return nullptr;
984 }
985 
areGlobalsPotentiallyEqual(const GlobalValue * GV1,const GlobalValue * GV2)986 static ICmpInst::Predicate areGlobalsPotentiallyEqual(const GlobalValue *GV1,
987                                                       const GlobalValue *GV2) {
988   auto isGlobalUnsafeForEquality = [](const GlobalValue *GV) {
989     if (GV->isInterposable() || GV->hasGlobalUnnamedAddr())
990       return true;
991     if (const auto *GVar = dyn_cast<GlobalVariable>(GV)) {
992       Type *Ty = GVar->getValueType();
993       // A global with opaque type might end up being zero sized.
994       if (!Ty->isSized())
995         return true;
996       // A global with an empty type might lie at the address of any other
997       // global.
998       if (Ty->isEmptyTy())
999         return true;
1000     }
1001     return false;
1002   };
1003   // Don't try to decide equality of aliases.
1004   if (!isa<GlobalAlias>(GV1) && !isa<GlobalAlias>(GV2))
1005     if (!isGlobalUnsafeForEquality(GV1) && !isGlobalUnsafeForEquality(GV2))
1006       return ICmpInst::ICMP_NE;
1007   return ICmpInst::BAD_ICMP_PREDICATE;
1008 }
1009 
1010 /// This function determines if there is anything we can decide about the two
1011 /// constants provided. This doesn't need to handle simple things like integer
1012 /// comparisons, but should instead handle ConstantExprs and GlobalValues.
1013 /// If we can determine that the two constants have a particular relation to
1014 /// each other, we should return the corresponding ICmp predicate, otherwise
1015 /// return ICmpInst::BAD_ICMP_PREDICATE.
evaluateICmpRelation(Constant * V1,Constant * V2)1016 static ICmpInst::Predicate evaluateICmpRelation(Constant *V1, Constant *V2) {
1017   assert(V1->getType() == V2->getType() &&
1018          "Cannot compare different types of values!");
1019   if (V1 == V2) return ICmpInst::ICMP_EQ;
1020 
1021   // The following folds only apply to pointers.
1022   if (!V1->getType()->isPointerTy())
1023     return ICmpInst::BAD_ICMP_PREDICATE;
1024 
1025   // To simplify this code we canonicalize the relation so that the first
1026   // operand is always the most "complex" of the two.  We consider simple
1027   // constants (like ConstantPointerNull) to be the simplest, followed by
1028   // BlockAddress, GlobalValues, and ConstantExpr's (the most complex).
1029   auto GetComplexity = [](Constant *V) {
1030     if (isa<ConstantExpr>(V))
1031       return 3;
1032     if (isa<GlobalValue>(V))
1033       return 2;
1034     if (isa<BlockAddress>(V))
1035       return 1;
1036     return 0;
1037   };
1038   if (GetComplexity(V1) < GetComplexity(V2)) {
1039     ICmpInst::Predicate SwappedRelation = evaluateICmpRelation(V2, V1);
1040     if (SwappedRelation != ICmpInst::BAD_ICMP_PREDICATE)
1041       return ICmpInst::getSwappedPredicate(SwappedRelation);
1042     return ICmpInst::BAD_ICMP_PREDICATE;
1043   }
1044 
1045   if (const BlockAddress *BA = dyn_cast<BlockAddress>(V1)) {
1046     // Now we know that the RHS is a BlockAddress or simple constant.
1047     if (const BlockAddress *BA2 = dyn_cast<BlockAddress>(V2)) {
1048       // Block address in another function can't equal this one, but block
1049       // addresses in the current function might be the same if blocks are
1050       // empty.
1051       if (BA2->getFunction() != BA->getFunction())
1052         return ICmpInst::ICMP_NE;
1053     } else if (isa<ConstantPointerNull>(V2)) {
1054       return ICmpInst::ICMP_NE;
1055     }
1056   } else if (const GlobalValue *GV = dyn_cast<GlobalValue>(V1)) {
1057     // Now we know that the RHS is a GlobalValue, BlockAddress or simple
1058     // constant.
1059     if (const GlobalValue *GV2 = dyn_cast<GlobalValue>(V2)) {
1060       return areGlobalsPotentiallyEqual(GV, GV2);
1061     } else if (isa<BlockAddress>(V2)) {
1062       return ICmpInst::ICMP_NE; // Globals never equal labels.
1063     } else if (isa<ConstantPointerNull>(V2)) {
1064       // GlobalVals can never be null unless they have external weak linkage.
1065       // We don't try to evaluate aliases here.
1066       // NOTE: We should not be doing this constant folding if null pointer
1067       // is considered valid for the function. But currently there is no way to
1068       // query it from the Constant type.
1069       if (!GV->hasExternalWeakLinkage() && !isa<GlobalAlias>(GV) &&
1070           !NullPointerIsDefined(nullptr /* F */,
1071                                 GV->getType()->getAddressSpace()))
1072         return ICmpInst::ICMP_UGT;
1073     }
1074   } else if (auto *CE1 = dyn_cast<ConstantExpr>(V1)) {
1075     // Ok, the LHS is known to be a constantexpr.  The RHS can be any of a
1076     // constantexpr, a global, block address, or a simple constant.
1077     Constant *CE1Op0 = CE1->getOperand(0);
1078 
1079     switch (CE1->getOpcode()) {
1080     case Instruction::GetElementPtr: {
1081       GEPOperator *CE1GEP = cast<GEPOperator>(CE1);
1082       // Ok, since this is a getelementptr, we know that the constant has a
1083       // pointer type.  Check the various cases.
1084       if (isa<ConstantPointerNull>(V2)) {
1085         // If we are comparing a GEP to a null pointer, check to see if the base
1086         // of the GEP equals the null pointer.
1087         if (const GlobalValue *GV = dyn_cast<GlobalValue>(CE1Op0)) {
1088           // If its not weak linkage, the GVal must have a non-zero address
1089           // so the result is greater-than
1090           if (!GV->hasExternalWeakLinkage() && CE1GEP->isInBounds())
1091             return ICmpInst::ICMP_UGT;
1092         }
1093       } else if (const GlobalValue *GV2 = dyn_cast<GlobalValue>(V2)) {
1094         if (const GlobalValue *GV = dyn_cast<GlobalValue>(CE1Op0)) {
1095           if (GV != GV2) {
1096             if (CE1GEP->hasAllZeroIndices())
1097               return areGlobalsPotentiallyEqual(GV, GV2);
1098             return ICmpInst::BAD_ICMP_PREDICATE;
1099           }
1100         }
1101       } else if (const auto *CE2GEP = dyn_cast<GEPOperator>(V2)) {
1102         // By far the most common case to handle is when the base pointers are
1103         // obviously to the same global.
1104         const Constant *CE2Op0 = cast<Constant>(CE2GEP->getPointerOperand());
1105         if (isa<GlobalValue>(CE1Op0) && isa<GlobalValue>(CE2Op0)) {
1106           // Don't know relative ordering, but check for inequality.
1107           if (CE1Op0 != CE2Op0) {
1108             if (CE1GEP->hasAllZeroIndices() && CE2GEP->hasAllZeroIndices())
1109               return areGlobalsPotentiallyEqual(cast<GlobalValue>(CE1Op0),
1110                                                 cast<GlobalValue>(CE2Op0));
1111             return ICmpInst::BAD_ICMP_PREDICATE;
1112           }
1113         }
1114       }
1115       break;
1116     }
1117     default:
1118       break;
1119     }
1120   }
1121 
1122   return ICmpInst::BAD_ICMP_PREDICATE;
1123 }
1124 
ConstantFoldCompareInstruction(CmpInst::Predicate Predicate,Constant * C1,Constant * C2)1125 Constant *llvm::ConstantFoldCompareInstruction(CmpInst::Predicate Predicate,
1126                                                Constant *C1, Constant *C2) {
1127   Type *ResultTy;
1128   if (VectorType *VT = dyn_cast<VectorType>(C1->getType()))
1129     ResultTy = VectorType::get(Type::getInt1Ty(C1->getContext()),
1130                                VT->getElementCount());
1131   else
1132     ResultTy = Type::getInt1Ty(C1->getContext());
1133 
1134   // Fold FCMP_FALSE/FCMP_TRUE unconditionally.
1135   if (Predicate == FCmpInst::FCMP_FALSE)
1136     return Constant::getNullValue(ResultTy);
1137 
1138   if (Predicate == FCmpInst::FCMP_TRUE)
1139     return Constant::getAllOnesValue(ResultTy);
1140 
1141   // Handle some degenerate cases first
1142   if (isa<PoisonValue>(C1) || isa<PoisonValue>(C2))
1143     return PoisonValue::get(ResultTy);
1144 
1145   if (isa<UndefValue>(C1) || isa<UndefValue>(C2)) {
1146     bool isIntegerPredicate = ICmpInst::isIntPredicate(Predicate);
1147     // For EQ and NE, we can always pick a value for the undef to make the
1148     // predicate pass or fail, so we can return undef.
1149     // Also, if both operands are undef, we can return undef for int comparison.
1150     if (ICmpInst::isEquality(Predicate) || (isIntegerPredicate && C1 == C2))
1151       return UndefValue::get(ResultTy);
1152 
1153     // Otherwise, for integer compare, pick the same value as the non-undef
1154     // operand, and fold it to true or false.
1155     if (isIntegerPredicate)
1156       return ConstantInt::get(ResultTy, CmpInst::isTrueWhenEqual(Predicate));
1157 
1158     // Choosing NaN for the undef will always make unordered comparison succeed
1159     // and ordered comparison fails.
1160     return ConstantInt::get(ResultTy, CmpInst::isUnordered(Predicate));
1161   }
1162 
1163   if (C2->isNullValue()) {
1164     // The caller is expected to commute the operands if the constant expression
1165     // is C2.
1166     // C1 >= 0 --> true
1167     if (Predicate == ICmpInst::ICMP_UGE)
1168       return Constant::getAllOnesValue(ResultTy);
1169     // C1 < 0 --> false
1170     if (Predicate == ICmpInst::ICMP_ULT)
1171       return Constant::getNullValue(ResultTy);
1172   }
1173 
1174   // If the comparison is a comparison between two i1's, simplify it.
1175   if (C1->getType()->isIntegerTy(1)) {
1176     switch (Predicate) {
1177     case ICmpInst::ICMP_EQ:
1178       if (isa<ConstantInt>(C2))
1179         return ConstantExpr::getXor(C1, ConstantExpr::getNot(C2));
1180       return ConstantExpr::getXor(ConstantExpr::getNot(C1), C2);
1181     case ICmpInst::ICMP_NE:
1182       return ConstantExpr::getXor(C1, C2);
1183     default:
1184       break;
1185     }
1186   }
1187 
1188   if (isa<ConstantInt>(C1) && isa<ConstantInt>(C2)) {
1189     const APInt &V1 = cast<ConstantInt>(C1)->getValue();
1190     const APInt &V2 = cast<ConstantInt>(C2)->getValue();
1191     return ConstantInt::get(ResultTy, ICmpInst::compare(V1, V2, Predicate));
1192   } else if (isa<ConstantFP>(C1) && isa<ConstantFP>(C2)) {
1193     const APFloat &C1V = cast<ConstantFP>(C1)->getValueAPF();
1194     const APFloat &C2V = cast<ConstantFP>(C2)->getValueAPF();
1195     return ConstantInt::get(ResultTy, FCmpInst::compare(C1V, C2V, Predicate));
1196   } else if (auto *C1VTy = dyn_cast<VectorType>(C1->getType())) {
1197 
1198     // Fast path for splatted constants.
1199     if (Constant *C1Splat = C1->getSplatValue())
1200       if (Constant *C2Splat = C2->getSplatValue())
1201         if (Constant *Elt =
1202                 ConstantFoldCompareInstruction(Predicate, C1Splat, C2Splat))
1203           return ConstantVector::getSplat(C1VTy->getElementCount(), Elt);
1204 
1205     // Do not iterate on scalable vector. The number of elements is unknown at
1206     // compile-time.
1207     if (isa<ScalableVectorType>(C1VTy))
1208       return nullptr;
1209 
1210     // If we can constant fold the comparison of each element, constant fold
1211     // the whole vector comparison.
1212     SmallVector<Constant*, 4> ResElts;
1213     Type *Ty = IntegerType::get(C1->getContext(), 32);
1214     // Compare the elements, producing an i1 result or constant expr.
1215     for (unsigned I = 0, E = C1VTy->getElementCount().getKnownMinValue();
1216          I != E; ++I) {
1217       Constant *C1E =
1218           ConstantExpr::getExtractElement(C1, ConstantInt::get(Ty, I));
1219       Constant *C2E =
1220           ConstantExpr::getExtractElement(C2, ConstantInt::get(Ty, I));
1221       Constant *Elt = ConstantFoldCompareInstruction(Predicate, C1E, C2E);
1222       if (!Elt)
1223         return nullptr;
1224 
1225       ResElts.push_back(Elt);
1226     }
1227 
1228     return ConstantVector::get(ResElts);
1229   }
1230 
1231   if (C1->getType()->isFPOrFPVectorTy()) {
1232     if (C1 == C2) {
1233       // We know that C1 == C2 || isUnordered(C1, C2).
1234       if (Predicate == FCmpInst::FCMP_ONE)
1235         return ConstantInt::getFalse(ResultTy);
1236       else if (Predicate == FCmpInst::FCMP_UEQ)
1237         return ConstantInt::getTrue(ResultTy);
1238     }
1239   } else {
1240     // Evaluate the relation between the two constants, per the predicate.
1241     int Result = -1;  // -1 = unknown, 0 = known false, 1 = known true.
1242     switch (evaluateICmpRelation(C1, C2)) {
1243     default: llvm_unreachable("Unknown relational!");
1244     case ICmpInst::BAD_ICMP_PREDICATE:
1245       break;  // Couldn't determine anything about these constants.
1246     case ICmpInst::ICMP_EQ:   // We know the constants are equal!
1247       // If we know the constants are equal, we can decide the result of this
1248       // computation precisely.
1249       Result = ICmpInst::isTrueWhenEqual(Predicate);
1250       break;
1251     case ICmpInst::ICMP_ULT:
1252       switch (Predicate) {
1253       case ICmpInst::ICMP_ULT: case ICmpInst::ICMP_NE: case ICmpInst::ICMP_ULE:
1254         Result = 1; break;
1255       case ICmpInst::ICMP_UGT: case ICmpInst::ICMP_EQ: case ICmpInst::ICMP_UGE:
1256         Result = 0; break;
1257       default:
1258         break;
1259       }
1260       break;
1261     case ICmpInst::ICMP_SLT:
1262       switch (Predicate) {
1263       case ICmpInst::ICMP_SLT: case ICmpInst::ICMP_NE: case ICmpInst::ICMP_SLE:
1264         Result = 1; break;
1265       case ICmpInst::ICMP_SGT: case ICmpInst::ICMP_EQ: case ICmpInst::ICMP_SGE:
1266         Result = 0; break;
1267       default:
1268         break;
1269       }
1270       break;
1271     case ICmpInst::ICMP_UGT:
1272       switch (Predicate) {
1273       case ICmpInst::ICMP_UGT: case ICmpInst::ICMP_NE: case ICmpInst::ICMP_UGE:
1274         Result = 1; break;
1275       case ICmpInst::ICMP_ULT: case ICmpInst::ICMP_EQ: case ICmpInst::ICMP_ULE:
1276         Result = 0; break;
1277       default:
1278         break;
1279       }
1280       break;
1281     case ICmpInst::ICMP_SGT:
1282       switch (Predicate) {
1283       case ICmpInst::ICMP_SGT: case ICmpInst::ICMP_NE: case ICmpInst::ICMP_SGE:
1284         Result = 1; break;
1285       case ICmpInst::ICMP_SLT: case ICmpInst::ICMP_EQ: case ICmpInst::ICMP_SLE:
1286         Result = 0; break;
1287       default:
1288         break;
1289       }
1290       break;
1291     case ICmpInst::ICMP_ULE:
1292       if (Predicate == ICmpInst::ICMP_UGT)
1293         Result = 0;
1294       if (Predicate == ICmpInst::ICMP_ULT || Predicate == ICmpInst::ICMP_ULE)
1295         Result = 1;
1296       break;
1297     case ICmpInst::ICMP_SLE:
1298       if (Predicate == ICmpInst::ICMP_SGT)
1299         Result = 0;
1300       if (Predicate == ICmpInst::ICMP_SLT || Predicate == ICmpInst::ICMP_SLE)
1301         Result = 1;
1302       break;
1303     case ICmpInst::ICMP_UGE:
1304       if (Predicate == ICmpInst::ICMP_ULT)
1305         Result = 0;
1306       if (Predicate == ICmpInst::ICMP_UGT || Predicate == ICmpInst::ICMP_UGE)
1307         Result = 1;
1308       break;
1309     case ICmpInst::ICMP_SGE:
1310       if (Predicate == ICmpInst::ICMP_SLT)
1311         Result = 0;
1312       if (Predicate == ICmpInst::ICMP_SGT || Predicate == ICmpInst::ICMP_SGE)
1313         Result = 1;
1314       break;
1315     case ICmpInst::ICMP_NE:
1316       if (Predicate == ICmpInst::ICMP_EQ)
1317         Result = 0;
1318       if (Predicate == ICmpInst::ICMP_NE)
1319         Result = 1;
1320       break;
1321     }
1322 
1323     // If we evaluated the result, return it now.
1324     if (Result != -1)
1325       return ConstantInt::get(ResultTy, Result);
1326 
1327     if ((!isa<ConstantExpr>(C1) && isa<ConstantExpr>(C2)) ||
1328         (C1->isNullValue() && !C2->isNullValue())) {
1329       // If C2 is a constant expr and C1 isn't, flip them around and fold the
1330       // other way if possible.
1331       // Also, if C1 is null and C2 isn't, flip them around.
1332       Predicate = ICmpInst::getSwappedPredicate(Predicate);
1333       return ConstantFoldCompareInstruction(Predicate, C2, C1);
1334     }
1335   }
1336   return nullptr;
1337 }
1338 
ConstantFoldGetElementPtr(Type * PointeeTy,Constant * C,std::optional<ConstantRange> InRange,ArrayRef<Value * > Idxs)1339 Constant *llvm::ConstantFoldGetElementPtr(Type *PointeeTy, Constant *C,
1340                                           std::optional<ConstantRange> InRange,
1341                                           ArrayRef<Value *> Idxs) {
1342   if (Idxs.empty()) return C;
1343 
1344   Type *GEPTy = GetElementPtrInst::getGEPReturnType(
1345       C, ArrayRef((Value *const *)Idxs.data(), Idxs.size()));
1346 
1347   if (isa<PoisonValue>(C))
1348     return PoisonValue::get(GEPTy);
1349 
1350   if (isa<UndefValue>(C))
1351     return UndefValue::get(GEPTy);
1352 
1353   auto IsNoOp = [&]() {
1354     // Avoid losing inrange information.
1355     if (InRange)
1356       return false;
1357 
1358     return all_of(Idxs, [](Value *Idx) {
1359       Constant *IdxC = cast<Constant>(Idx);
1360       return IdxC->isNullValue() || isa<UndefValue>(IdxC);
1361     });
1362   };
1363   if (IsNoOp())
1364     return GEPTy->isVectorTy() && !C->getType()->isVectorTy()
1365                ? ConstantVector::getSplat(
1366                      cast<VectorType>(GEPTy)->getElementCount(), C)
1367                : C;
1368 
1369   return nullptr;
1370 }
1371