1 //===- InstCombineNegator.cpp -----------------------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements sinking of negation into expression trees,
10 // as long as that can be done without increasing instruction count.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "InstCombineInternal.h"
15 #include "llvm/ADT/APInt.h"
16 #include "llvm/ADT/ArrayRef.h"
17 #include "llvm/ADT/DenseMap.h"
18 #include "llvm/ADT/None.h"
19 #include "llvm/ADT/Optional.h"
20 #include "llvm/ADT/STLExtras.h"
21 #include "llvm/ADT/SmallVector.h"
22 #include "llvm/ADT/Statistic.h"
23 #include "llvm/ADT/StringRef.h"
24 #include "llvm/ADT/Twine.h"
25 #include "llvm/ADT/iterator_range.h"
26 #include "llvm/Analysis/TargetFolder.h"
27 #include "llvm/Analysis/ValueTracking.h"
28 #include "llvm/IR/Constant.h"
29 #include "llvm/IR/Constants.h"
30 #include "llvm/IR/DebugLoc.h"
31 #include "llvm/IR/IRBuilder.h"
32 #include "llvm/IR/Instruction.h"
33 #include "llvm/IR/Instructions.h"
34 #include "llvm/IR/PatternMatch.h"
35 #include "llvm/IR/Type.h"
36 #include "llvm/IR/Use.h"
37 #include "llvm/IR/User.h"
38 #include "llvm/IR/Value.h"
39 #include "llvm/Support/Casting.h"
40 #include "llvm/Support/CommandLine.h"
41 #include "llvm/Support/Compiler.h"
42 #include "llvm/Support/DebugCounter.h"
43 #include "llvm/Support/ErrorHandling.h"
44 #include "llvm/Support/raw_ostream.h"
45 #include "llvm/Transforms/InstCombine/InstCombiner.h"
46 #include <cassert>
47 #include <cstdint>
48 #include <functional>
49 #include <tuple>
50 #include <type_traits>
51 #include <utility>
52 
// Forward declarations of the context/analysis types that the Negator
// constructor below accepts by reference.
namespace llvm {
class AssumptionCache;
class DataLayout;
class DominatorTree;
class LLVMContext;
} // namespace llvm
59 
60 using namespace llvm;
61 
62 #define DEBUG_TYPE "instcombine"
63 
// Statistics tracked by the Negator. Every counter below is updated by code
// further down in this file; the per-counter notes say where.

// Incremented once at the start of every Negator::Negate() call.
STATISTIC(NegatorTotalNegationsAttempted,
          "Negator: Number of negations attempted to be sinked");
// Incremented in Negator::Negate() once Negator::run() produced a result.
STATISTIC(NegatorNumTreesNegated,
          "Negator: Number of negations successfully sinked");
// Raised (via updateMax) to the Depth argument on every Negator::negate() call.
STATISTIC(NegatorMaxDepthVisited, "Negator: Maximal traversal depth ever "
                                  "reached while attempting to sink negation");
// Incremented in Negator::visitImpl() when Depth exceeds NegatorMaxDepth.
STATISTIC(NegatorTimesDepthLimitReached,
          "Negator: How many times did the traversal depth limit was reached "
          "during sinking");
// Incremented on every Negator::negate() call, cached or not.
STATISTIC(
    NegatorNumValuesVisited,
    "Negator: Total number of values visited during attempts to sink negation");
// Incremented in Negator::negate() when the value is found in NegationsCache.
STATISTIC(NegatorNumNegationsFoundInCache,
          "Negator: How many negations did we retrieve/reuse from cache");
// Raised (via updateMax) in the Negator destructor to the per-instance
// visited-values count.
STATISTIC(NegatorMaxTotalValuesVisited,
          "Negator: Maximal number of values ever visited while attempting to "
          "sink negation");
// Incremented by the builder's inserter callback set up in the constructor.
STATISTIC(NegatorNumInstructionsCreatedTotal,
          "Negator: Number of new negated instructions created, total");
// Raised (via updateMax) in Negator::Negate() to the number of instructions
// created by a successful attempt.
STATISTIC(NegatorMaxInstructionsCreated,
          "Negator: Maximal number of new instructions created during negation "
          "attempt");
// Increased in Negator::Negate() by the number of instructions created by a
// successful attempt.
STATISTIC(NegatorNumInstructionsNegatedSuccess,
          "Negator: Number of new negated instructions created in successful "
          "negation sinking attempts");

// Debug counter consulted by Negator::Negate() through
// DebugCounter::shouldExecute(); when it declines, the attempt is abandoned.
DEBUG_COUNTER(NegatorCounter, "instcombine-negator",
              "Controls Negator transformations in InstCombine pass");
92 
// Master switch, on by default. Negator::Negate() returns nullptr without
// attempting anything when this is false.
static cl::opt<bool>
    NegatorEnabled("instcombine-negator-enabled", cl::init(true),
                   cl::desc("Should we attempt to sink negations?"));

// Recursion limit used by Negator::visitImpl(): once Depth exceeds this value,
// the cases that need recursive reasoning are no longer attempted. The default,
// NegatorDefaultMaxDepth, is declared outside this file.
static cl::opt<unsigned>
    NegatorMaxDepth("instcombine-negator-max-depth",
                    cl::init(NegatorDefaultMaxDepth),
                    cl::desc("What is the maximal lookup depth when trying to "
                             "check for viability of negation sinking."));
102 
/// Construct a Negator.
///
/// The internal builder is created from the context \p C, a TargetFolder built
/// from \p DL_, and an inserter callback. For every instruction the callback is
/// invoked on, it bumps NegatorNumInstructionsCreatedTotal and appends the
/// instruction to NewInstructions, so that run() can later either hand the
/// created instructions back to the caller or erase them.
///
/// \p DL_, \p AC_ and \p DT_ are stored in the DL, AC and DT members, and
/// \p IsTrulyNegation_ is stored in IsTrulyNegation.
Negator::Negator(LLVMContext &C, const DataLayout &DL_, AssumptionCache &AC_,
                 const DominatorTree &DT_, bool IsTrulyNegation_)
    : Builder(C, TargetFolder(DL_),
              // The callback refers to the NewInstructions member of this
              // object (captured through the default by-reference capture).
              IRBuilderCallbackInserter([&](Instruction *I) {
                ++NegatorNumInstructionsCreatedTotal;
                NewInstructions.push_back(I);
              })),
      DL(DL_), AC(AC_), DT(DT_), IsTrulyNegation(IsTrulyNegation_) {}
111 
// The destructor is only defined when statistics are enabled: its sole job is
// to fold this instance's visited-values count into the global maximum.
#if LLVM_ENABLE_STATS
Negator::~Negator() {
  NegatorMaxTotalValuesVisited.updateMax(NumValuesVisitedInThisNegator);
}
#endif
117 
118 // Due to the InstCombine's worklist management, there are no guarantees that
119 // each instruction we'll encounter has been visited by InstCombine already.
120 // In particular, most importantly for us, that means we have to canonicalize
121 // constants to RHS ourselves, since that is helpful sometimes.
122 std::array<Value *, 2> Negator::getSortedOperandsOfBinOp(Instruction *I) {
123   assert(I->getNumOperands() == 2 && "Only for binops!");
124   std::array<Value *, 2> Ops{I->getOperand(0), I->getOperand(1)};
125   if (I->isCommutative() && InstCombiner::getComplexity(I->getOperand(0)) <
126                                 InstCombiner::getComplexity(I->getOperand(1)))
127     std::swap(Ops[0], Ops[1]);
128   return Ops;
129 }
130 
// Try to build a value that is the negation of \p V.
//
// Returns the negated value on success and nullptr when no negation is
// produced. \p Depth is the current recursion depth; operands are negated
// through negate() with Depth + 1.
//
// The function proceeds in stages:
//   1. Trivial answers: undef, i1 values, existing negations and integral
//      constants.
//   2. Non-instructions are rejected; multi-use values are rejected unless
//      IsTrulyNegation is set.
//   3. A first switch with non-recursive patterns that are also allowed for
//      multi-use values.
//   4. A second switch with non-recursive patterns restricted to single-use
//      values.
//   5. After the depth-limit check, a third switch with the patterns that
//      need their operands to be negated recursively.
//
// FIXME: can this be reworked into a worklist-based algorithm while preserving
// the depth-first, early bailout traversal?
LLVM_NODISCARD Value *Negator::visitImpl(Value *V, unsigned Depth) {
  // -(undef) -> undef.
  if (match(V, m_Undef()))
    return V;

  // In i1, negation can simply be ignored.
  if (V->getType()->isIntOrIntVectorTy(1))
    return V;

  Value *X;

  // -(-(X)) -> X.
  if (match(V, m_Neg(m_Value(X))))
    return X;

  // Integral constants can be freely negated.
  if (match(V, m_AnyIntegralConstant()))
    return ConstantExpr::getNeg(cast<Constant>(V), /*HasNUW=*/false,
                                /*HasNSW=*/false);

  // If we have a non-instruction, then give up.
  if (!isa<Instruction>(V))
    return nullptr;

  // If we have started with a true negation (i.e. `sub 0, %y`), then if we've
  // got instruction that does not require recursive reasoning, we can still
  // negate it even if it has other uses, without increasing instruction count.
  if (!V->hasOneUse() && !IsTrulyNegation)
    return nullptr;

  auto *I = cast<Instruction>(V);
  unsigned BitWidth = I->getType()->getScalarSizeInBits();

  // We must preserve the insertion point and debug info that is set in the
  // builder at the time this function is called.
  InstCombiner::BuilderTy::InsertPointGuard Guard(Builder);
  // And since we are trying to negate instruction I, that tells us about the
  // insertion point and the debug info that we need to keep.
  Builder.SetInsertPoint(I);

  // In some cases we can give the answer without further recursion.
  switch (I->getOpcode()) {
  case Instruction::Add: {
    std::array<Value *, 2> Ops = getSortedOperandsOfBinOp(I);
    // `inc` is always negatible: -(x + 1) == ~x.
    if (match(Ops[1], m_One()))
      return Builder.CreateNot(Ops[0], I->getName() + ".neg");
    break;
  }
  case Instruction::Xor:
    // `not` is always negatible: -(~x) == x + 1.
    if (match(I, m_Not(m_Value(X))))
      return Builder.CreateAdd(X, ConstantInt::get(X->getType(), 1),
                               I->getName() + ".neg");
    break;
  case Instruction::AShr:
  case Instruction::LShr: {
    // Right-shift sign bit smear is negatible.
    // Only a constant shift amount of exactly BitWidth - 1 qualifies; the
    // negation is then the same shift with the opposite opcode
    // (ashr <-> lshr).
    const APInt *Op1Val;
    if (match(I->getOperand(1), m_APInt(Op1Val)) && *Op1Val == BitWidth - 1) {
      Value *BO = I->getOpcode() == Instruction::AShr
                      ? Builder.CreateLShr(I->getOperand(0), I->getOperand(1))
                      : Builder.CreateAShr(I->getOperand(0), I->getOperand(1));
      // The builder may have folded the shift to a non-instruction, hence the
      // dyn_cast before touching flags and name.
      if (auto *NewInstr = dyn_cast<Instruction>(BO)) {
        NewInstr->copyIRFlags(I);
        NewInstr->setName(I->getName() + ".neg");
      }
      return BO;
    }
    // While we could negate exact arithmetic shift:
    //   ashr exact %x, C  -->   sdiv exact i8 %x, -1<<C
    // iff C != 0 and C u< bitwidth(%x), we don't want to,
    // because division is *THAT* much worse than a shift.
    break;
  }
  case Instruction::SExt:
  case Instruction::ZExt:
    // `*ext` of i1 is always negatible: swap sext <-> zext of the same
    // operand.
    if (I->getOperand(0)->getType()->isIntOrIntVectorTy(1))
      return I->getOpcode() == Instruction::SExt
                 ? Builder.CreateZExt(I->getOperand(0), I->getType(),
                                      I->getName() + ".neg")
                 : Builder.CreateSExt(I->getOperand(0), I->getType(),
                                      I->getName() + ".neg");
    break;
  default:
    break; // Other instructions require recursive reasoning.
  }

  // Some other cases, while still don't require recursion,
  // are restricted to the one-use case.
  if (!V->hasOneUse())
    return nullptr;

  switch (I->getOpcode()) {
  case Instruction::Sub:
    // `sub` is always negatible: -(a - b) == b - a.
    // But if the old `sub` sticks around, even though we don't increase
    // instruction count, this is a likely regression since we increased
    // live-range of *both* of the operands, which might lead to more spilling.
    return Builder.CreateSub(I->getOperand(1), I->getOperand(0),
                             I->getName() + ".neg");
  case Instruction::SDiv:
    // `sdiv` is negatible if divisor is not undef/INT_MIN/1.
    // While this is normally not behind a use-check,
    // let's consider division to be special since it's costly.
    if (auto *Op1C = dyn_cast<Constant>(I->getOperand(1))) {
      if (!Op1C->containsUndefElement() && Op1C->isNotMinSignedValue() &&
          Op1C->isNotOneValue()) {
        // Negate the constant divisor instead of the quotient.
        Value *BO =
            Builder.CreateSDiv(I->getOperand(0), ConstantExpr::getNeg(Op1C),
                               I->getName() + ".neg");
        // Carry over the `exact` flag if a real instruction was created.
        if (auto *NewInstr = dyn_cast<Instruction>(BO))
          NewInstr->setIsExact(I->isExact());
        return BO;
      }
    }
    break;
  }

  // Rest of the logic is recursive, so if it's time to give up then it's time.
  if (Depth > NegatorMaxDepth) {
    LLVM_DEBUG(dbgs() << "Negator: reached maximal allowed traversal depth in "
                      << *V << ". Giving up.\n");
    ++NegatorTimesDepthLimitReached;
    return nullptr;
  }

  switch (I->getOpcode()) {
  case Instruction::Freeze: {
    // `freeze` is negatible if its operand is negatible.
    Value *NegOp = negate(I->getOperand(0), Depth + 1);
    if (!NegOp) // Early return.
      return nullptr;
    return Builder.CreateFreeze(NegOp, I->getName() + ".neg");
  }
  case Instruction::PHI: {
    // `phi` is negatible if all the incoming values are negatible.
    auto *PHI = cast<PHINode>(I);
    SmallVector<Value *, 4> NegatedIncomingValues(PHI->getNumOperands());
    // Note: the loop variable `I` below shadows the instruction `I` above;
    // here it is a tuple of (incoming value, slot for its negation).
    for (auto I : zip(PHI->incoming_values(), NegatedIncomingValues)) {
      if (!(std::get<1>(I) =
                negate(std::get<0>(I), Depth + 1))) // Early return.
        return nullptr;
    }
    // All incoming values are indeed negatible. Create negated PHI node.
    PHINode *NegatedPHI = Builder.CreatePHI(
        PHI->getType(), PHI->getNumOperands(), PHI->getName() + ".neg");
    // Pair each negated value with the corresponding incoming block.
    for (auto I : zip(NegatedIncomingValues, PHI->blocks()))
      NegatedPHI->addIncoming(std::get<0>(I), std::get<1>(I));
    return NegatedPHI;
  }
  case Instruction::Select: {
    if (isKnownNegation(I->getOperand(1), I->getOperand(2))) {
      // If one hand of select is known to be negation of another hand,
      // just swap the hands around.
      auto *NewSelect = cast<SelectInst>(I->clone());
      // Just swap the operands of the select.
      NewSelect->swapValues();
      // Don't swap prof metadata, we didn't change the branch behavior.
      NewSelect->setName(I->getName() + ".neg");
      // The clone is not in any block yet; insert it at the builder's
      // insertion point (which also runs the inserter callback).
      Builder.Insert(NewSelect);
      return NewSelect;
    }
    // `select` is negatible if both hands of `select` are negatible.
    Value *NegOp1 = negate(I->getOperand(1), Depth + 1);
    if (!NegOp1) // Early return.
      return nullptr;
    Value *NegOp2 = negate(I->getOperand(2), Depth + 1);
    if (!NegOp2)
      return nullptr;
    // Do preserve the metadata!
    return Builder.CreateSelect(I->getOperand(0), NegOp1, NegOp2,
                                I->getName() + ".neg", /*MDFrom=*/I);
  }
  case Instruction::ShuffleVector: {
    // `shufflevector` is negatible if both operands are negatible.
    auto *Shuf = cast<ShuffleVectorInst>(I);
    Value *NegOp0 = negate(I->getOperand(0), Depth + 1);
    if (!NegOp0) // Early return.
      return nullptr;
    Value *NegOp1 = negate(I->getOperand(1), Depth + 1);
    if (!NegOp1)
      return nullptr;
    // Same mask, negated inputs.
    return Builder.CreateShuffleVector(NegOp0, NegOp1, Shuf->getShuffleMask(),
                                       I->getName() + ".neg");
  }
  case Instruction::ExtractElement: {
    // `extractelement` is negatible if source operand is negatible.
    auto *EEI = cast<ExtractElementInst>(I);
    Value *NegVector = negate(EEI->getVectorOperand(), Depth + 1);
    if (!NegVector) // Early return.
      return nullptr;
    return Builder.CreateExtractElement(NegVector, EEI->getIndexOperand(),
                                        I->getName() + ".neg");
  }
  case Instruction::InsertElement: {
    // `insertelement` is negatible if both the source vector and
    // element-to-be-inserted are negatible.
    auto *IEI = cast<InsertElementInst>(I);
    Value *NegVector = negate(IEI->getOperand(0), Depth + 1);
    if (!NegVector) // Early return.
      return nullptr;
    Value *NegNewElt = negate(IEI->getOperand(1), Depth + 1);
    if (!NegNewElt) // Early return.
      return nullptr;
    // Operand 2 (the insertion index) is reused unchanged.
    return Builder.CreateInsertElement(NegVector, NegNewElt, IEI->getOperand(2),
                                       I->getName() + ".neg");
  }
  case Instruction::Trunc: {
    // `trunc` is negatible if its operand is negatible.
    Value *NegOp = negate(I->getOperand(0), Depth + 1);
    if (!NegOp) // Early return.
      return nullptr;
    return Builder.CreateTrunc(NegOp, I->getType(), I->getName() + ".neg");
  }
  case Instruction::Shl: {
    // `shl` is negatible if the first operand is negatible.
    if (Value *NegOp0 = negate(I->getOperand(0), Depth + 1))
      return Builder.CreateShl(NegOp0, I->getOperand(1), I->getName() + ".neg");
    // Otherwise, `shl %x, C` can be interpreted as `mul %x, 1<<C`.
    // The negated form is then `mul %x, -1<<C`.
    // NOTE(review): this replaces a shift with a multiply regardless of
    // IsTrulyNegation -- confirm that is intended for the non-true-negation
    // case.
    auto *Op1C = dyn_cast<Constant>(I->getOperand(1));
    if (!Op1C) // Early return.
      return nullptr;
    return Builder.CreateMul(
        I->getOperand(0),
        ConstantExpr::getShl(Constant::getAllOnesValue(Op1C->getType()), Op1C),
        I->getName() + ".neg");
  }
  case Instruction::Or: {
    if (!haveNoCommonBitsSet(I->getOperand(0), I->getOperand(1), DL, &AC, I,
                             &DT))
      return nullptr; // Don't know how to handle `or` in general.
    std::array<Value *, 2> Ops = getSortedOperandsOfBinOp(I);
    // `or`/`add` are interchangeable when operands have no common bits set.
    // `inc` is always negatible.
    if (match(Ops[1], m_One()))
      return Builder.CreateNot(Ops[0], I->getName() + ".neg");
    // Else, just defer to Instruction::Add handling.
    LLVM_FALLTHROUGH;
  }
  case Instruction::Add: {
    // `add` is negatible if both of its operands are negatible.
    SmallVector<Value *, 2> NegatedOps, NonNegatedOps;
    for (Value *Op : I->operands()) {
      // Can we sink the negation into this operand?
      if (Value *NegOp = negate(Op, Depth + 1)) {
        NegatedOps.emplace_back(NegOp); // Successfully negated operand!
        continue;
      }
      // Failed to sink negation into this operand. IFF we started from negation
      // and we manage to sink negation into one operand, we can still do this.
      if (!IsTrulyNegation)
        return nullptr;
      NonNegatedOps.emplace_back(Op); // Just record which operand that was.
    }
    assert((NegatedOps.size() + NonNegatedOps.size()) == 2 &&
           "Internal consistency sanity check.");
    // Did we manage to sink negation into both of the operands?
    if (NegatedOps.size() == 2) // Then we get to keep the `add`!
      return Builder.CreateAdd(NegatedOps[0], NegatedOps[1],
                               I->getName() + ".neg");
    assert(IsTrulyNegation && "We should have early-exited then.");
    // Completely failed to sink negation?
    if (NonNegatedOps.size() == 2)
      return nullptr;
    // Exactly one operand was negated:
    // 0-(a+b) --> (-a)-b
    return Builder.CreateSub(NegatedOps[0], NonNegatedOps[0],
                             I->getName() + ".neg");
  }
  case Instruction::Xor: {
    std::array<Value *, 2> Ops = getSortedOperandsOfBinOp(I);
    // `xor` is negatible if one of its operands is invertible.
    // Only a constant second operand is handled:
    //   -(x ^ C) == (x ^ ~C) + 1
    // NOTE(review): this emits two values (xor + add) in place of one `xor`
    // regardless of IsTrulyNegation -- confirm this cannot increase the
    // instruction count in the non-true-negation case.
    // FIXME: InstCombineInverter? But how to connect Inverter and Negator?
    if (auto *C = dyn_cast<Constant>(Ops[1])) {
      Value *Xor = Builder.CreateXor(Ops[0], ConstantExpr::getNot(C));
      return Builder.CreateAdd(Xor, ConstantInt::get(Xor->getType(), 1),
                               I->getName() + ".neg");
    }
    return nullptr;
  }
  case Instruction::Mul: {
    std::array<Value *, 2> Ops = getSortedOperandsOfBinOp(I);
    // `mul` is negatible if one of its operands is negatible.
    Value *NegatedOp, *OtherOp;
    // First try the second operand, in case it's a constant it will be best to
    // just invert it instead of sinking the `neg` deeper.
    if (Value *NegOp1 = negate(Ops[1], Depth + 1)) {
      NegatedOp = NegOp1;
      OtherOp = Ops[0];
    } else if (Value *NegOp0 = negate(Ops[0], Depth + 1)) {
      NegatedOp = NegOp0;
      OtherOp = Ops[1];
    } else
      // Can't negate either of them.
      return nullptr;
    return Builder.CreateMul(NegatedOp, OtherOp, I->getName() + ".neg");
  }
  default:
    return nullptr; // Don't know, likely not negatible for free.
  }

  llvm_unreachable("Can't get here. We always return from switch.");
}
437 
438 LLVM_NODISCARD Value *Negator::negate(Value *V, unsigned Depth) {
439   NegatorMaxDepthVisited.updateMax(Depth);
440   ++NegatorNumValuesVisited;
441 
442 #if LLVM_ENABLE_STATS
443   ++NumValuesVisitedInThisNegator;
444 #endif
445 
446 #ifndef NDEBUG
447   // We can't ever have a Value with such an address.
448   Value *Placeholder = reinterpret_cast<Value *>(static_cast<uintptr_t>(-1));
449 #endif
450 
451   // Did we already try to negate this value?
452   auto NegationsCacheIterator = NegationsCache.find(V);
453   if (NegationsCacheIterator != NegationsCache.end()) {
454     ++NegatorNumNegationsFoundInCache;
455     Value *NegatedV = NegationsCacheIterator->second;
456     assert(NegatedV != Placeholder && "Encountered a cycle during negation.");
457     return NegatedV;
458   }
459 
460 #ifndef NDEBUG
461   // We did not find a cached result for negation of V. While there,
462   // let's temporairly cache a placeholder value, with the idea that if later
463   // during negation we fetch it from cache, we'll know we're in a cycle.
464   NegationsCache[V] = Placeholder;
465 #endif
466 
467   // No luck. Try negating it for real.
468   Value *NegatedV = visitImpl(V, Depth);
469   // And cache the (real) result for the future.
470   NegationsCache[V] = NegatedV;
471 
472   return NegatedV;
473 }
474 
475 LLVM_NODISCARD Optional<Negator::Result> Negator::run(Value *Root) {
476   Value *Negated = negate(Root, /*Depth=*/0);
477   if (!Negated) {
478     // We must cleanup newly-inserted instructions, to avoid any potential
479     // endless combine looping.
480     llvm::for_each(llvm::reverse(NewInstructions),
481                    [&](Instruction *I) { I->eraseFromParent(); });
482     return llvm::None;
483   }
484   return std::make_pair(ArrayRef<Instruction *>(NewInstructions), Negated);
485 }
486 
487 LLVM_NODISCARD Value *Negator::Negate(bool LHSIsZero, Value *Root,
488                                       InstCombinerImpl &IC) {
489   ++NegatorTotalNegationsAttempted;
490   LLVM_DEBUG(dbgs() << "Negator: attempting to sink negation into " << *Root
491                     << "\n");
492 
493   if (!NegatorEnabled || !DebugCounter::shouldExecute(NegatorCounter))
494     return nullptr;
495 
496   Negator N(Root->getContext(), IC.getDataLayout(), IC.getAssumptionCache(),
497             IC.getDominatorTree(), LHSIsZero);
498   Optional<Result> Res = N.run(Root);
499   if (!Res) { // Negation failed.
500     LLVM_DEBUG(dbgs() << "Negator: failed to sink negation into " << *Root
501                       << "\n");
502     return nullptr;
503   }
504 
505   LLVM_DEBUG(dbgs() << "Negator: successfully sunk negation into " << *Root
506                     << "\n         NEW: " << *Res->second << "\n");
507   ++NegatorNumTreesNegated;
508 
509   // We must temporarily unset the 'current' insertion point and DebugLoc of the
510   // InstCombine's IRBuilder so that it won't interfere with the ones we have
511   // already specified when producing negated instructions.
512   InstCombiner::BuilderTy::InsertPointGuard Guard(IC.Builder);
513   IC.Builder.ClearInsertionPoint();
514   IC.Builder.SetCurrentDebugLocation(DebugLoc());
515 
516   // And finally, we must add newly-created instructions into the InstCombine's
517   // worklist (in a proper order!) so it can attempt to combine them.
518   LLVM_DEBUG(dbgs() << "Negator: Propagating " << Res->first.size()
519                     << " instrs to InstCombine\n");
520   NegatorMaxInstructionsCreated.updateMax(Res->first.size());
521   NegatorNumInstructionsNegatedSuccess += Res->first.size();
522 
523   // They are in def-use order, so nothing fancy, just insert them in order.
524   llvm::for_each(Res->first,
525                  [&](Instruction *I) { IC.Builder.Insert(I, I->getName()); });
526 
527   // And return the new root.
528   return Res->second;
529 }
530