1 //===- Attributor.cpp - Module-wide attribute deduction -------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements an inter procedural pass that deduces and/or propagating 10 // attributes. This is done in an abstract interpretation style fixpoint 11 // iteration. See the Attributor.h file comment and the class descriptions in 12 // that file for more information. 13 // 14 //===----------------------------------------------------------------------===// 15 16 #include "llvm/Transforms/IPO/Attributor.h" 17 18 #include "llvm/ADT/DepthFirstIterator.h" 19 #include "llvm/ADT/STLExtras.h" 20 #include "llvm/ADT/SmallPtrSet.h" 21 #include "llvm/ADT/SmallVector.h" 22 #include "llvm/ADT/Statistic.h" 23 #include "llvm/Analysis/CaptureTracking.h" 24 #include "llvm/Analysis/EHPersonalities.h" 25 #include "llvm/Analysis/GlobalsModRef.h" 26 #include "llvm/Analysis/Loads.h" 27 #include "llvm/Analysis/MemoryBuiltins.h" 28 #include "llvm/Analysis/ValueTracking.h" 29 #include "llvm/IR/Argument.h" 30 #include "llvm/IR/Attributes.h" 31 #include "llvm/IR/CFG.h" 32 #include "llvm/IR/InstIterator.h" 33 #include "llvm/IR/IntrinsicInst.h" 34 #include "llvm/Support/CommandLine.h" 35 #include "llvm/Support/Debug.h" 36 #include "llvm/Support/raw_ostream.h" 37 #include "llvm/Transforms/Utils/BasicBlockUtils.h" 38 #include "llvm/Transforms/Utils/Local.h" 39 40 #include <cassert> 41 42 using namespace llvm; 43 44 #define DEBUG_TYPE "attributor" 45 46 STATISTIC(NumFnWithExactDefinition, 47 "Number of function with exact definitions"); 48 STATISTIC(NumFnWithoutExactDefinition, 49 "Number of function without exact definitions"); 50 STATISTIC(NumAttributesTimedOut, 51 "Number of abstract attributes timed out before fixpoint"); 52 STATISTIC(NumAttributesValidFixpoint, 53 "Number of abstract attributes in a valid fixpoint state"); 54 STATISTIC(NumAttributesManifested, 55 "Number of abstract attributes manifested in IR"); 56 57 // Some helper macros to deal with statistics tracking. 58 // 59 // Usage: 60 // For simple IR attribute tracking overload trackStatistics in the abstract 61 // attribute and choose the right STATS_DECLTRACK_********* macro, 62 // e.g.,: 63 // void trackStatistics() const override { 64 // STATS_DECLTRACK_ARG_ATTR(returned) 65 // } 66 // If there is a single "increment" side one can use the macro 67 // STATS_DECLTRACK with a custom message. If there are multiple increment 68 // sides, STATS_DECL and STATS_TRACK can also be used separatly. 69 // 70 #define BUILD_STAT_MSG_IR_ATTR(TYPE, NAME) \ 71 ("Number of " #TYPE " marked '" #NAME "'") 72 #define BUILD_STAT_NAME(NAME, TYPE) NumIR##TYPE##_##NAME 73 #define STATS_DECL_(NAME, MSG) STATISTIC(NAME, MSG); 74 #define STATS_DECL(NAME, TYPE, MSG) \ 75 STATS_DECL_(BUILD_STAT_NAME(NAME, TYPE), MSG); 76 #define STATS_TRACK(NAME, TYPE) ++(BUILD_STAT_NAME(NAME, TYPE)); 77 #define STATS_DECLTRACK(NAME, TYPE, MSG) \ 78 { \ 79 STATS_DECL(NAME, TYPE, MSG) \ 80 STATS_TRACK(NAME, TYPE) \ 81 } 82 #define STATS_DECLTRACK_ARG_ATTR(NAME) \ 83 STATS_DECLTRACK(NAME, Arguments, BUILD_STAT_MSG_IR_ATTR(arguments, NAME)) 84 #define STATS_DECLTRACK_CSARG_ATTR(NAME) \ 85 STATS_DECLTRACK(NAME, CSArguments, \ 86 BUILD_STAT_MSG_IR_ATTR(call site arguments, NAME)) 87 #define STATS_DECLTRACK_FN_ATTR(NAME) \ 88 STATS_DECLTRACK(NAME, Function, BUILD_STAT_MSG_IR_ATTR(functions, NAME)) 89 #define STATS_DECLTRACK_CS_ATTR(NAME) \ 90 STATS_DECLTRACK(NAME, CS, BUILD_STAT_MSG_IR_ATTR(call site, NAME)) 91 #define STATS_DECLTRACK_FNRET_ATTR(NAME) \ 92 STATS_DECLTRACK(NAME, FunctionReturn, \ 93 BUILD_STAT_MSG_IR_ATTR(function returns, NAME)) 94 #define STATS_DECLTRACK_CSRET_ATTR(NAME) \ 95 STATS_DECLTRACK(NAME, CSReturn, \ 96 BUILD_STAT_MSG_IR_ATTR(call site returns, NAME)) 97 #define STATS_DECLTRACK_FLOATING_ATTR(NAME) \ 98 STATS_DECLTRACK(NAME, Floating, \ 99 ("Number of floating values known to be '" #NAME "'")) 100 101 // TODO: Determine a good default value. 102 // 103 // In the LLVM-TS and SPEC2006, 32 seems to not induce compile time overheads 104 // (when run with the first 5 abstract attributes). The results also indicate 105 // that we never reach 32 iterations but always find a fixpoint sooner. 106 // 107 // This will become more evolved once we perform two interleaved fixpoint 108 // iterations: bottom-up and top-down. 109 static cl::opt<unsigned> 110 MaxFixpointIterations("attributor-max-iterations", cl::Hidden, 111 cl::desc("Maximal number of fixpoint iterations."), 112 cl::init(32)); 113 static cl::opt<bool> VerifyMaxFixpointIterations( 114 "attributor-max-iterations-verify", cl::Hidden, 115 cl::desc("Verify that max-iterations is a tight bound for a fixpoint"), 116 cl::init(false)); 117 118 static cl::opt<bool> DisableAttributor( 119 "attributor-disable", cl::Hidden, 120 cl::desc("Disable the attributor inter-procedural deduction pass."), 121 cl::init(true)); 122 123 static cl::opt<bool> ManifestInternal( 124 "attributor-manifest-internal", cl::Hidden, 125 cl::desc("Manifest Attributor internal string attributes."), 126 cl::init(false)); 127 128 static cl::opt<unsigned> DepRecInterval( 129 "attributor-dependence-recompute-interval", cl::Hidden, 130 cl::desc("Number of iterations until dependences are recomputed."), 131 cl::init(4)); 132 133 static cl::opt<bool> EnableHeapToStack("enable-heap-to-stack-conversion", 134 cl::init(true), cl::Hidden); 135 136 static cl::opt<int> MaxHeapToStackSize("max-heap-to-stack-size", cl::init(128), 137 cl::Hidden); 138 139 /// Logic operators for the change status enum class. 140 /// 141 ///{ 142 ChangeStatus llvm::operator|(ChangeStatus l, ChangeStatus r) { 143 return l == ChangeStatus::CHANGED ? l : r; 144 } 145 ChangeStatus llvm::operator&(ChangeStatus l, ChangeStatus r) { 146 return l == ChangeStatus::UNCHANGED ? l : r; 147 } 148 ///} 149 150 /// Recursively visit all values that might become \p IRP at some point. This 151 /// will be done by looking through cast instructions, selects, phis, and calls 152 /// with the "returned" attribute. Once we cannot look through the value any 153 /// further, the callback \p VisitValueCB is invoked and passed the current 154 /// value, the \p State, and a flag to indicate if we stripped anything. To 155 /// limit how much effort is invested, we will never visit more values than 156 /// specified by \p MaxValues. 157 template <typename AAType, typename StateTy> 158 static bool genericValueTraversal( 159 Attributor &A, IRPosition IRP, const AAType &QueryingAA, StateTy &State, 160 const function_ref<bool(Value &, StateTy &, bool)> &VisitValueCB, 161 int MaxValues = 8) { 162 163 const AAIsDead *LivenessAA = nullptr; 164 if (IRP.getAnchorScope()) 165 LivenessAA = &A.getAAFor<AAIsDead>( 166 QueryingAA, IRPosition::function(*IRP.getAnchorScope()), 167 /* TrackDependence */ false); 168 bool AnyDead = false; 169 170 // TODO: Use Positions here to allow context sensitivity in VisitValueCB 171 SmallPtrSet<Value *, 16> Visited; 172 SmallVector<Value *, 16> Worklist; 173 Worklist.push_back(&IRP.getAssociatedValue()); 174 175 int Iteration = 0; 176 do { 177 Value *V = Worklist.pop_back_val(); 178 179 // Check if we should process the current value. To prevent endless 180 // recursion keep a record of the values we followed! 181 if (!Visited.insert(V).second) 182 continue; 183 184 // Make sure we limit the compile time for complex expressions. 185 if (Iteration++ >= MaxValues) 186 return false; 187 188 // Explicitly look through calls with a "returned" attribute if we do 189 // not have a pointer as stripPointerCasts only works on them. 190 Value *NewV = nullptr; 191 if (V->getType()->isPointerTy()) { 192 NewV = V->stripPointerCasts(); 193 } else { 194 CallSite CS(V); 195 if (CS && CS.getCalledFunction()) { 196 for (Argument &Arg : CS.getCalledFunction()->args()) 197 if (Arg.hasReturnedAttr()) { 198 NewV = CS.getArgOperand(Arg.getArgNo()); 199 break; 200 } 201 } 202 } 203 if (NewV && NewV != V) { 204 Worklist.push_back(NewV); 205 continue; 206 } 207 208 // Look through select instructions, visit both potential values. 209 if (auto *SI = dyn_cast<SelectInst>(V)) { 210 Worklist.push_back(SI->getTrueValue()); 211 Worklist.push_back(SI->getFalseValue()); 212 continue; 213 } 214 215 // Look through phi nodes, visit all live operands. 216 if (auto *PHI = dyn_cast<PHINode>(V)) { 217 assert(LivenessAA && 218 "Expected liveness in the presence of instructions!"); 219 for (unsigned u = 0, e = PHI->getNumIncomingValues(); u < e; u++) { 220 const BasicBlock *IncomingBB = PHI->getIncomingBlock(u); 221 if (LivenessAA->isAssumedDead(IncomingBB->getTerminator())) { 222 AnyDead = true; 223 continue; 224 } 225 Worklist.push_back(PHI->getIncomingValue(u)); 226 } 227 continue; 228 } 229 230 // Once a leaf is reached we inform the user through the callback. 231 if (!VisitValueCB(*V, State, Iteration > 1)) 232 return false; 233 } while (!Worklist.empty()); 234 235 // If we actually used liveness information so we have to record a dependence. 236 if (AnyDead) 237 A.recordDependence(*LivenessAA, QueryingAA); 238 239 // All values have been visited. 240 return true; 241 } 242 243 /// Return true if \p New is equal or worse than \p Old. 244 static bool isEqualOrWorse(const Attribute &New, const Attribute &Old) { 245 if (!Old.isIntAttribute()) 246 return true; 247 248 return Old.getValueAsInt() >= New.getValueAsInt(); 249 } 250 251 /// Return true if the information provided by \p Attr was added to the 252 /// attribute list \p Attrs. This is only the case if it was not already present 253 /// in \p Attrs at the position describe by \p PK and \p AttrIdx. 254 static bool addIfNotExistent(LLVMContext &Ctx, const Attribute &Attr, 255 AttributeList &Attrs, int AttrIdx) { 256 257 if (Attr.isEnumAttribute()) { 258 Attribute::AttrKind Kind = Attr.getKindAsEnum(); 259 if (Attrs.hasAttribute(AttrIdx, Kind)) 260 if (isEqualOrWorse(Attr, Attrs.getAttribute(AttrIdx, Kind))) 261 return false; 262 Attrs = Attrs.addAttribute(Ctx, AttrIdx, Attr); 263 return true; 264 } 265 if (Attr.isStringAttribute()) { 266 StringRef Kind = Attr.getKindAsString(); 267 if (Attrs.hasAttribute(AttrIdx, Kind)) 268 if (isEqualOrWorse(Attr, Attrs.getAttribute(AttrIdx, Kind))) 269 return false; 270 Attrs = Attrs.addAttribute(Ctx, AttrIdx, Attr); 271 return true; 272 } 273 if (Attr.isIntAttribute()) { 274 Attribute::AttrKind Kind = Attr.getKindAsEnum(); 275 if (Attrs.hasAttribute(AttrIdx, Kind)) 276 if (isEqualOrWorse(Attr, Attrs.getAttribute(AttrIdx, Kind))) 277 return false; 278 Attrs = Attrs.removeAttribute(Ctx, AttrIdx, Kind); 279 Attrs = Attrs.addAttribute(Ctx, AttrIdx, Attr); 280 return true; 281 } 282 283 llvm_unreachable("Expected enum or string attribute!"); 284 } 285 static const Value *getPointerOperand(const Instruction *I) { 286 if (auto *LI = dyn_cast<LoadInst>(I)) 287 if (!LI->isVolatile()) 288 return LI->getPointerOperand(); 289 290 if (auto *SI = dyn_cast<StoreInst>(I)) 291 if (!SI->isVolatile()) 292 return SI->getPointerOperand(); 293 294 if (auto *CXI = dyn_cast<AtomicCmpXchgInst>(I)) 295 if (!CXI->isVolatile()) 296 return CXI->getPointerOperand(); 297 298 if (auto *RMWI = dyn_cast<AtomicRMWInst>(I)) 299 if (!RMWI->isVolatile()) 300 return RMWI->getPointerOperand(); 301 302 return nullptr; 303 } 304 static const Value *getBasePointerOfAccessPointerOperand(const Instruction *I, 305 int64_t &BytesOffset, 306 const DataLayout &DL) { 307 const Value *Ptr = getPointerOperand(I); 308 if (!Ptr) 309 return nullptr; 310 311 return GetPointerBaseWithConstantOffset(Ptr, BytesOffset, DL, 312 /*AllowNonInbounds*/ false); 313 } 314 315 ChangeStatus AbstractAttribute::update(Attributor &A) { 316 ChangeStatus HasChanged = ChangeStatus::UNCHANGED; 317 if (getState().isAtFixpoint()) 318 return HasChanged; 319 320 LLVM_DEBUG(dbgs() << "[Attributor] Update: " << *this << "\n"); 321 322 HasChanged = updateImpl(A); 323 324 LLVM_DEBUG(dbgs() << "[Attributor] Update " << HasChanged << " " << *this 325 << "\n"); 326 327 return HasChanged; 328 } 329 330 ChangeStatus 331 IRAttributeManifest::manifestAttrs(Attributor &A, IRPosition &IRP, 332 const ArrayRef<Attribute> &DeducedAttrs) { 333 Function *ScopeFn = IRP.getAssociatedFunction(); 334 IRPosition::Kind PK = IRP.getPositionKind(); 335 336 // In the following some generic code that will manifest attributes in 337 // DeducedAttrs if they improve the current IR. Due to the different 338 // annotation positions we use the underlying AttributeList interface. 339 340 AttributeList Attrs; 341 switch (PK) { 342 case IRPosition::IRP_INVALID: 343 case IRPosition::IRP_FLOAT: 344 return ChangeStatus::UNCHANGED; 345 case IRPosition::IRP_ARGUMENT: 346 case IRPosition::IRP_FUNCTION: 347 case IRPosition::IRP_RETURNED: 348 Attrs = ScopeFn->getAttributes(); 349 break; 350 case IRPosition::IRP_CALL_SITE: 351 case IRPosition::IRP_CALL_SITE_RETURNED: 352 case IRPosition::IRP_CALL_SITE_ARGUMENT: 353 Attrs = ImmutableCallSite(&IRP.getAnchorValue()).getAttributes(); 354 break; 355 } 356 357 ChangeStatus HasChanged = ChangeStatus::UNCHANGED; 358 LLVMContext &Ctx = IRP.getAnchorValue().getContext(); 359 for (const Attribute &Attr : DeducedAttrs) { 360 if (!addIfNotExistent(Ctx, Attr, Attrs, IRP.getAttrIdx())) 361 continue; 362 363 HasChanged = ChangeStatus::CHANGED; 364 } 365 366 if (HasChanged == ChangeStatus::UNCHANGED) 367 return HasChanged; 368 369 switch (PK) { 370 case IRPosition::IRP_ARGUMENT: 371 case IRPosition::IRP_FUNCTION: 372 case IRPosition::IRP_RETURNED: 373 ScopeFn->setAttributes(Attrs); 374 break; 375 case IRPosition::IRP_CALL_SITE: 376 case IRPosition::IRP_CALL_SITE_RETURNED: 377 case IRPosition::IRP_CALL_SITE_ARGUMENT: 378 CallSite(&IRP.getAnchorValue()).setAttributes(Attrs); 379 break; 380 case IRPosition::IRP_INVALID: 381 case IRPosition::IRP_FLOAT: 382 break; 383 } 384 385 return HasChanged; 386 } 387 388 const IRPosition IRPosition::EmptyKey(255); 389 const IRPosition IRPosition::TombstoneKey(256); 390 391 SubsumingPositionIterator::SubsumingPositionIterator(const IRPosition &IRP) { 392 IRPositions.emplace_back(IRP); 393 394 ImmutableCallSite ICS(&IRP.getAnchorValue()); 395 switch (IRP.getPositionKind()) { 396 case IRPosition::IRP_INVALID: 397 case IRPosition::IRP_FLOAT: 398 case IRPosition::IRP_FUNCTION: 399 return; 400 case IRPosition::IRP_ARGUMENT: 401 case IRPosition::IRP_RETURNED: 402 IRPositions.emplace_back( 403 IRPosition::function(*IRP.getAssociatedFunction())); 404 return; 405 case IRPosition::IRP_CALL_SITE: 406 assert(ICS && "Expected call site!"); 407 // TODO: We need to look at the operand bundles similar to the redirection 408 // in CallBase. 409 if (!ICS.hasOperandBundles()) 410 if (const Function *Callee = ICS.getCalledFunction()) 411 IRPositions.emplace_back(IRPosition::function(*Callee)); 412 return; 413 case IRPosition::IRP_CALL_SITE_RETURNED: 414 assert(ICS && "Expected call site!"); 415 // TODO: We need to look at the operand bundles similar to the redirection 416 // in CallBase. 417 if (!ICS.hasOperandBundles()) { 418 if (const Function *Callee = ICS.getCalledFunction()) { 419 IRPositions.emplace_back(IRPosition::returned(*Callee)); 420 IRPositions.emplace_back(IRPosition::function(*Callee)); 421 } 422 } 423 IRPositions.emplace_back( 424 IRPosition::callsite_function(cast<CallBase>(*ICS.getInstruction()))); 425 return; 426 case IRPosition::IRP_CALL_SITE_ARGUMENT: { 427 int ArgNo = IRP.getArgNo(); 428 assert(ICS && ArgNo >= 0 && "Expected call site!"); 429 // TODO: We need to look at the operand bundles similar to the redirection 430 // in CallBase. 431 if (!ICS.hasOperandBundles()) { 432 const Function *Callee = ICS.getCalledFunction(); 433 if (Callee && Callee->arg_size() > unsigned(ArgNo)) 434 IRPositions.emplace_back(IRPosition::argument(*Callee->getArg(ArgNo))); 435 if (Callee) 436 IRPositions.emplace_back(IRPosition::function(*Callee)); 437 } 438 IRPositions.emplace_back(IRPosition::value(IRP.getAssociatedValue())); 439 return; 440 } 441 } 442 } 443 444 bool IRPosition::hasAttr(ArrayRef<Attribute::AttrKind> AKs, 445 bool IgnoreSubsumingPositions) const { 446 for (const IRPosition &EquivIRP : SubsumingPositionIterator(*this)) { 447 for (Attribute::AttrKind AK : AKs) 448 if (EquivIRP.getAttr(AK).getKindAsEnum() == AK) 449 return true; 450 // The first position returned by the SubsumingPositionIterator is 451 // always the position itself. If we ignore subsuming positions we 452 // are done after the first iteration. 453 if (IgnoreSubsumingPositions) 454 break; 455 } 456 return false; 457 } 458 459 void IRPosition::getAttrs(ArrayRef<Attribute::AttrKind> AKs, 460 SmallVectorImpl<Attribute> &Attrs) const { 461 for (const IRPosition &EquivIRP : SubsumingPositionIterator(*this)) 462 for (Attribute::AttrKind AK : AKs) { 463 const Attribute &Attr = EquivIRP.getAttr(AK); 464 if (Attr.getKindAsEnum() == AK) 465 Attrs.push_back(Attr); 466 } 467 } 468 469 void IRPosition::verify() { 470 switch (KindOrArgNo) { 471 default: 472 assert(KindOrArgNo >= 0 && "Expected argument or call site argument!"); 473 assert((isa<CallBase>(AnchorVal) || isa<Argument>(AnchorVal)) && 474 "Expected call base or argument for positive attribute index!"); 475 if (isa<Argument>(AnchorVal)) { 476 assert(cast<Argument>(AnchorVal)->getArgNo() == unsigned(getArgNo()) && 477 "Argument number mismatch!"); 478 assert(cast<Argument>(AnchorVal) == &getAssociatedValue() && 479 "Associated value mismatch!"); 480 } else { 481 assert(cast<CallBase>(*AnchorVal).arg_size() > unsigned(getArgNo()) && 482 "Call site argument number mismatch!"); 483 assert(cast<CallBase>(*AnchorVal).getArgOperand(getArgNo()) == 484 &getAssociatedValue() && 485 "Associated value mismatch!"); 486 } 487 break; 488 case IRP_INVALID: 489 assert(!AnchorVal && "Expected no value for an invalid position!"); 490 break; 491 case IRP_FLOAT: 492 assert((!isa<CallBase>(&getAssociatedValue()) && 493 !isa<Argument>(&getAssociatedValue())) && 494 "Expected specialized kind for call base and argument values!"); 495 break; 496 case IRP_RETURNED: 497 assert(isa<Function>(AnchorVal) && 498 "Expected function for a 'returned' position!"); 499 assert(AnchorVal == &getAssociatedValue() && "Associated value mismatch!"); 500 break; 501 case IRP_CALL_SITE_RETURNED: 502 assert((isa<CallBase>(AnchorVal)) && 503 "Expected call base for 'call site returned' position!"); 504 assert(AnchorVal == &getAssociatedValue() && "Associated value mismatch!"); 505 break; 506 case IRP_CALL_SITE: 507 assert((isa<CallBase>(AnchorVal)) && 508 "Expected call base for 'call site function' position!"); 509 assert(AnchorVal == &getAssociatedValue() && "Associated value mismatch!"); 510 break; 511 case IRP_FUNCTION: 512 assert(isa<Function>(AnchorVal) && 513 "Expected function for a 'function' position!"); 514 assert(AnchorVal == &getAssociatedValue() && "Associated value mismatch!"); 515 break; 516 } 517 } 518 519 namespace { 520 /// Helper functions to clamp a state \p S of type \p StateType with the 521 /// information in \p R and indicate/return if \p S did change (as-in update is 522 /// required to be run again). 523 /// 524 ///{ 525 template <typename StateType> 526 ChangeStatus clampStateAndIndicateChange(StateType &S, const StateType &R); 527 528 template <> 529 ChangeStatus clampStateAndIndicateChange<IntegerState>(IntegerState &S, 530 const IntegerState &R) { 531 auto Assumed = S.getAssumed(); 532 S ^= R; 533 return Assumed == S.getAssumed() ? ChangeStatus::UNCHANGED 534 : ChangeStatus::CHANGED; 535 } 536 537 template <> 538 ChangeStatus clampStateAndIndicateChange<BooleanState>(BooleanState &S, 539 const BooleanState &R) { 540 return clampStateAndIndicateChange<IntegerState>(S, R); 541 } 542 ///} 543 544 /// Clamp the information known for all returned values of a function 545 /// (identified by \p QueryingAA) into \p S. 546 template <typename AAType, typename StateType = typename AAType::StateType> 547 static void clampReturnedValueStates(Attributor &A, const AAType &QueryingAA, 548 StateType &S) { 549 LLVM_DEBUG(dbgs() << "[Attributor] Clamp return value states for " 550 << static_cast<const AbstractAttribute &>(QueryingAA) 551 << " into " << S << "\n"); 552 553 assert((QueryingAA.getIRPosition().getPositionKind() == 554 IRPosition::IRP_RETURNED || 555 QueryingAA.getIRPosition().getPositionKind() == 556 IRPosition::IRP_CALL_SITE_RETURNED) && 557 "Can only clamp returned value states for a function returned or call " 558 "site returned position!"); 559 560 // Use an optional state as there might not be any return values and we want 561 // to join (IntegerState::operator&) the state of all there are. 562 Optional<StateType> T; 563 564 // Callback for each possibly returned value. 565 auto CheckReturnValue = [&](Value &RV) -> bool { 566 const IRPosition &RVPos = IRPosition::value(RV); 567 const AAType &AA = A.getAAFor<AAType>(QueryingAA, RVPos); 568 LLVM_DEBUG(dbgs() << "[Attributor] RV: " << RV << " AA: " << AA.getAsStr() 569 << " @ " << RVPos << "\n"); 570 const StateType &AAS = static_cast<const StateType &>(AA.getState()); 571 if (T.hasValue()) 572 *T &= AAS; 573 else 574 T = AAS; 575 LLVM_DEBUG(dbgs() << "[Attributor] AA State: " << AAS << " RV State: " << T 576 << "\n"); 577 return T->isValidState(); 578 }; 579 580 if (!A.checkForAllReturnedValues(CheckReturnValue, QueryingAA)) 581 S.indicatePessimisticFixpoint(); 582 else if (T.hasValue()) 583 S ^= *T; 584 } 585 586 /// Helper class to compose two generic deduction 587 template <typename AAType, typename Base, typename StateType, 588 template <typename...> class F, template <typename...> class G> 589 struct AAComposeTwoGenericDeduction 590 : public F<AAType, G<AAType, Base, StateType>, StateType> { 591 AAComposeTwoGenericDeduction(const IRPosition &IRP) 592 : F<AAType, G<AAType, Base, StateType>, StateType>(IRP) {} 593 594 /// See AbstractAttribute::updateImpl(...). 595 ChangeStatus updateImpl(Attributor &A) override { 596 ChangeStatus ChangedF = F<AAType, G<AAType, Base, StateType>, StateType>::updateImpl(A); 597 ChangeStatus ChangedG = G<AAType, Base, StateType>::updateImpl(A); 598 return ChangedF | ChangedG; 599 } 600 }; 601 602 /// Helper class for generic deduction: return value -> returned position. 603 template <typename AAType, typename Base, 604 typename StateType = typename AAType::StateType> 605 struct AAReturnedFromReturnedValues : public Base { 606 AAReturnedFromReturnedValues(const IRPosition &IRP) : Base(IRP) {} 607 608 /// See AbstractAttribute::updateImpl(...). 609 ChangeStatus updateImpl(Attributor &A) override { 610 StateType S; 611 clampReturnedValueStates<AAType, StateType>(A, *this, S); 612 // TODO: If we know we visited all returned values, thus no are assumed 613 // dead, we can take the known information from the state T. 614 return clampStateAndIndicateChange<StateType>(this->getState(), S); 615 } 616 }; 617 618 /// Clamp the information known at all call sites for a given argument 619 /// (identified by \p QueryingAA) into \p S. 620 template <typename AAType, typename StateType = typename AAType::StateType> 621 static void clampCallSiteArgumentStates(Attributor &A, const AAType &QueryingAA, 622 StateType &S) { 623 LLVM_DEBUG(dbgs() << "[Attributor] Clamp call site argument states for " 624 << static_cast<const AbstractAttribute &>(QueryingAA) 625 << " into " << S << "\n"); 626 627 assert(QueryingAA.getIRPosition().getPositionKind() == 628 IRPosition::IRP_ARGUMENT && 629 "Can only clamp call site argument states for an argument position!"); 630 631 // Use an optional state as there might not be any return values and we want 632 // to join (IntegerState::operator&) the state of all there are. 633 Optional<StateType> T; 634 635 // The argument number which is also the call site argument number. 636 unsigned ArgNo = QueryingAA.getIRPosition().getArgNo(); 637 638 auto CallSiteCheck = [&](AbstractCallSite ACS) { 639 const IRPosition &ACSArgPos = IRPosition::callsite_argument(ACS, ArgNo); 640 // Check if a coresponding argument was found or if it is on not associated 641 // (which can happen for callback calls). 642 if (ACSArgPos.getPositionKind() == IRPosition::IRP_INVALID) 643 return false; 644 645 const AAType &AA = A.getAAFor<AAType>(QueryingAA, ACSArgPos); 646 LLVM_DEBUG(dbgs() << "[Attributor] ACS: " << *ACS.getInstruction() 647 << " AA: " << AA.getAsStr() << " @" << ACSArgPos << "\n"); 648 const StateType &AAS = static_cast<const StateType &>(AA.getState()); 649 if (T.hasValue()) 650 *T &= AAS; 651 else 652 T = AAS; 653 LLVM_DEBUG(dbgs() << "[Attributor] AA State: " << AAS << " CSA State: " << T 654 << "\n"); 655 return T->isValidState(); 656 }; 657 658 if (!A.checkForAllCallSites(CallSiteCheck, QueryingAA, true)) 659 S.indicatePessimisticFixpoint(); 660 else if (T.hasValue()) 661 S ^= *T; 662 } 663 664 /// Helper class for generic deduction: call site argument -> argument position. 665 template <typename AAType, typename Base, 666 typename StateType = typename AAType::StateType> 667 struct AAArgumentFromCallSiteArguments : public Base { 668 AAArgumentFromCallSiteArguments(const IRPosition &IRP) : Base(IRP) {} 669 670 /// See AbstractAttribute::updateImpl(...). 671 ChangeStatus updateImpl(Attributor &A) override { 672 StateType S; 673 clampCallSiteArgumentStates<AAType, StateType>(A, *this, S); 674 // TODO: If we know we visited all incoming values, thus no are assumed 675 // dead, we can take the known information from the state T. 676 return clampStateAndIndicateChange<StateType>(this->getState(), S); 677 } 678 }; 679 680 /// Helper class for generic replication: function returned -> cs returned. 681 template <typename AAType, typename Base, 682 typename StateType = typename AAType::StateType> 683 struct AACallSiteReturnedFromReturned : public Base { 684 AACallSiteReturnedFromReturned(const IRPosition &IRP) : Base(IRP) {} 685 686 /// See AbstractAttribute::updateImpl(...). 687 ChangeStatus updateImpl(Attributor &A) override { 688 assert(this->getIRPosition().getPositionKind() == 689 IRPosition::IRP_CALL_SITE_RETURNED && 690 "Can only wrap function returned positions for call site returned " 691 "positions!"); 692 auto &S = this->getState(); 693 694 const Function *AssociatedFunction = 695 this->getIRPosition().getAssociatedFunction(); 696 if (!AssociatedFunction) 697 return S.indicatePessimisticFixpoint(); 698 699 IRPosition FnPos = IRPosition::returned(*AssociatedFunction); 700 const AAType &AA = A.getAAFor<AAType>(*this, FnPos); 701 return clampStateAndIndicateChange( 702 S, static_cast<const typename AAType::StateType &>(AA.getState())); 703 } 704 }; 705 706 /// Helper class for generic deduction using must-be-executed-context 707 /// Base class is required to have `followUse` method. 708 709 /// bool followUse(Attributor &A, const Use *U, const Instruction *I) 710 /// U - Underlying use. 711 /// I - The user of the \p U. 712 /// `followUse` returns true if the value should be tracked transitively. 713 714 template <typename AAType, typename Base, 715 typename StateType = typename AAType::StateType> 716 struct AAFromMustBeExecutedContext : public Base { 717 AAFromMustBeExecutedContext(const IRPosition &IRP) : Base(IRP) {} 718 719 void initialize(Attributor &A) override { 720 Base::initialize(A); 721 IRPosition &IRP = this->getIRPosition(); 722 Instruction *CtxI = IRP.getCtxI(); 723 724 if (!CtxI) 725 return; 726 727 for (const Use &U : IRP.getAssociatedValue().uses()) 728 Uses.insert(&U); 729 } 730 731 /// See AbstractAttribute::updateImpl(...). 732 ChangeStatus updateImpl(Attributor &A) override { 733 auto BeforeState = this->getState(); 734 auto &S = this->getState(); 735 Instruction *CtxI = this->getIRPosition().getCtxI(); 736 if (!CtxI) 737 return ChangeStatus::UNCHANGED; 738 739 MustBeExecutedContextExplorer &Explorer = 740 A.getInfoCache().getMustBeExecutedContextExplorer(); 741 742 SetVector<const Use *> NextUses; 743 744 for (const Use *U : Uses) { 745 if (const Instruction *UserI = dyn_cast<Instruction>(U->getUser())) { 746 auto EIt = Explorer.begin(CtxI), EEnd = Explorer.end(CtxI); 747 bool Found = EIt.count(UserI); 748 while (!Found && ++EIt != EEnd) 749 Found = EIt.getCurrentInst() == UserI; 750 if (Found && Base::followUse(A, U, UserI)) 751 for (const Use &Us : UserI->uses()) 752 NextUses.insert(&Us); 753 } 754 } 755 for (const Use *U : NextUses) 756 Uses.insert(U); 757 758 return BeforeState == S ? ChangeStatus::UNCHANGED : ChangeStatus::CHANGED; 759 } 760 761 private: 762 /// Container for (transitive) uses of the associated value. 763 SetVector<const Use *> Uses; 764 }; 765 766 template <typename AAType, typename Base, 767 typename StateType = typename AAType::StateType> 768 using AAArgumentFromCallSiteArgumentsAndMustBeExecutedContext = 769 AAComposeTwoGenericDeduction<AAType, Base, StateType, 770 AAFromMustBeExecutedContext, 771 AAArgumentFromCallSiteArguments>; 772 773 template <typename AAType, typename Base, 774 typename StateType = typename AAType::StateType> 775 using AACallSiteReturnedFromReturnedAndMustBeExecutedContext = 776 AAComposeTwoGenericDeduction<AAType, Base, StateType, 777 AAFromMustBeExecutedContext, 778 AACallSiteReturnedFromReturned>; 779 780 /// -----------------------NoUnwind Function Attribute-------------------------- 781 782 struct AANoUnwindImpl : AANoUnwind { 783 AANoUnwindImpl(const IRPosition &IRP) : AANoUnwind(IRP) {} 784 785 const std::string getAsStr() const override { 786 return getAssumed() ? "nounwind" : "may-unwind"; 787 } 788 789 /// See AbstractAttribute::updateImpl(...). 790 ChangeStatus updateImpl(Attributor &A) override { 791 auto Opcodes = { 792 (unsigned)Instruction::Invoke, (unsigned)Instruction::CallBr, 793 (unsigned)Instruction::Call, (unsigned)Instruction::CleanupRet, 794 (unsigned)Instruction::CatchSwitch, (unsigned)Instruction::Resume}; 795 796 auto CheckForNoUnwind = [&](Instruction &I) { 797 if (!I.mayThrow()) 798 return true; 799 800 if (ImmutableCallSite ICS = ImmutableCallSite(&I)) { 801 const auto &NoUnwindAA = 802 A.getAAFor<AANoUnwind>(*this, IRPosition::callsite_function(ICS)); 803 return NoUnwindAA.isAssumedNoUnwind(); 804 } 805 return false; 806 }; 807 808 if (!A.checkForAllInstructions(CheckForNoUnwind, *this, Opcodes)) 809 return indicatePessimisticFixpoint(); 810 811 return ChangeStatus::UNCHANGED; 812 } 813 }; 814 815 struct AANoUnwindFunction final : public AANoUnwindImpl { 816 AANoUnwindFunction(const IRPosition &IRP) : AANoUnwindImpl(IRP) {} 817 818 /// See AbstractAttribute::trackStatistics() 819 void trackStatistics() const override { STATS_DECLTRACK_FN_ATTR(nounwind) } 820 }; 821 822 /// NoUnwind attribute deduction for a call sites. 823 struct AANoUnwindCallSite final : AANoUnwindImpl { 824 AANoUnwindCallSite(const IRPosition &IRP) : AANoUnwindImpl(IRP) {} 825 826 /// See AbstractAttribute::initialize(...). 827 void initialize(Attributor &A) override { 828 AANoUnwindImpl::initialize(A); 829 Function *F = getAssociatedFunction(); 830 if (!F) 831 indicatePessimisticFixpoint(); 832 } 833 834 /// See AbstractAttribute::updateImpl(...). 835 ChangeStatus updateImpl(Attributor &A) override { 836 // TODO: Once we have call site specific value information we can provide 837 // call site specific liveness information and then it makes 838 // sense to specialize attributes for call sites arguments instead of 839 // redirecting requests to the callee argument. 840 Function *F = getAssociatedFunction(); 841 const IRPosition &FnPos = IRPosition::function(*F); 842 auto &FnAA = A.getAAFor<AANoUnwind>(*this, FnPos); 843 return clampStateAndIndicateChange( 844 getState(), 845 static_cast<const AANoUnwind::StateType &>(FnAA.getState())); 846 } 847 848 /// See AbstractAttribute::trackStatistics() 849 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(nounwind); } 850 }; 851 852 /// --------------------- Function Return Values ------------------------------- 853 854 /// "Attribute" that collects all potential returned values and the return 855 /// instructions that they arise from. 856 /// 857 /// If there is a unique returned value R, the manifest method will: 858 /// - mark R with the "returned" attribute, if R is an argument. 859 class AAReturnedValuesImpl : public AAReturnedValues, public AbstractState { 860 861 /// Mapping of values potentially returned by the associated function to the 862 /// return instructions that might return them. 863 MapVector<Value *, SmallSetVector<ReturnInst *, 4>> ReturnedValues; 864 865 /// Mapping to remember the number of returned values for a call site such 866 /// that we can avoid updates if nothing changed. 867 DenseMap<const CallBase *, unsigned> NumReturnedValuesPerKnownAA; 868 869 /// Set of unresolved calls returned by the associated function. 870 SmallSetVector<CallBase *, 4> UnresolvedCalls; 871 872 /// State flags 873 /// 874 ///{ 875 bool IsFixed = false; 876 bool IsValidState = true; 877 ///} 878 879 public: 880 AAReturnedValuesImpl(const IRPosition &IRP) : AAReturnedValues(IRP) {} 881 882 /// See AbstractAttribute::initialize(...). 883 void initialize(Attributor &A) override { 884 // Reset the state. 885 IsFixed = false; 886 IsValidState = true; 887 ReturnedValues.clear(); 888 889 Function *F = getAssociatedFunction(); 890 if (!F) { 891 indicatePessimisticFixpoint(); 892 return; 893 } 894 895 // The map from instruction opcodes to those instructions in the function. 896 auto &OpcodeInstMap = A.getInfoCache().getOpcodeInstMapForFunction(*F); 897 898 // Look through all arguments, if one is marked as returned we are done. 899 for (Argument &Arg : F->args()) { 900 if (Arg.hasReturnedAttr()) { 901 auto &ReturnInstSet = ReturnedValues[&Arg]; 902 for (Instruction *RI : OpcodeInstMap[Instruction::Ret]) 903 ReturnInstSet.insert(cast<ReturnInst>(RI)); 904 905 indicateOptimisticFixpoint(); 906 return; 907 } 908 } 909 910 if (!F->hasExactDefinition()) 911 indicatePessimisticFixpoint(); 912 } 913 914 /// See AbstractAttribute::manifest(...). 915 ChangeStatus manifest(Attributor &A) override; 916 917 /// See AbstractAttribute::getState(...). 918 AbstractState &getState() override { return *this; } 919 920 /// See AbstractAttribute::getState(...). 921 const AbstractState &getState() const override { return *this; } 922 923 /// See AbstractAttribute::updateImpl(Attributor &A). 924 ChangeStatus updateImpl(Attributor &A) override; 925 926 llvm::iterator_range<iterator> returned_values() override { 927 return llvm::make_range(ReturnedValues.begin(), ReturnedValues.end()); 928 } 929 930 llvm::iterator_range<const_iterator> returned_values() const override { 931 return llvm::make_range(ReturnedValues.begin(), ReturnedValues.end()); 932 } 933 934 const SmallSetVector<CallBase *, 4> &getUnresolvedCalls() const override { 935 return UnresolvedCalls; 936 } 937 938 /// Return the number of potential return values, -1 if unknown. 939 size_t getNumReturnValues() const override { 940 return isValidState() ? ReturnedValues.size() : -1; 941 } 942 943 /// Return an assumed unique return value if a single candidate is found. If 944 /// there cannot be one, return a nullptr. If it is not clear yet, return the 945 /// Optional::NoneType. 946 Optional<Value *> getAssumedUniqueReturnValue(Attributor &A) const; 947 948 /// See AbstractState::checkForAllReturnedValues(...). 949 bool checkForAllReturnedValuesAndReturnInsts( 950 const function_ref<bool(Value &, const SmallSetVector<ReturnInst *, 4> &)> 951 &Pred) const override; 952 953 /// Pretty print the attribute similar to the IR representation. 954 const std::string getAsStr() const override; 955 956 /// See AbstractState::isAtFixpoint(). 957 bool isAtFixpoint() const override { return IsFixed; } 958 959 /// See AbstractState::isValidState(). 960 bool isValidState() const override { return IsValidState; } 961 962 /// See AbstractState::indicateOptimisticFixpoint(...). 963 ChangeStatus indicateOptimisticFixpoint() override { 964 IsFixed = true; 965 return ChangeStatus::UNCHANGED; 966 } 967 968 ChangeStatus indicatePessimisticFixpoint() override { 969 IsFixed = true; 970 IsValidState = false; 971 return ChangeStatus::CHANGED; 972 } 973 }; 974 975 ChangeStatus AAReturnedValuesImpl::manifest(Attributor &A) { 976 ChangeStatus Changed = ChangeStatus::UNCHANGED; 977 978 // Bookkeeping. 979 assert(isValidState()); 980 STATS_DECLTRACK(KnownReturnValues, FunctionReturn, 981 "Number of function with known return values"); 982 983 // Check if we have an assumed unique return value that we could manifest. 984 Optional<Value *> UniqueRV = getAssumedUniqueReturnValue(A); 985 986 if (!UniqueRV.hasValue() || !UniqueRV.getValue()) 987 return Changed; 988 989 // Bookkeeping. 990 STATS_DECLTRACK(UniqueReturnValue, FunctionReturn, 991 "Number of function with unique return"); 992 993 // Callback to replace the uses of CB with the constant C. 994 auto ReplaceCallSiteUsersWith = [](CallBase &CB, Constant &C) { 995 if (CB.getNumUses() == 0 || CB.isMustTailCall()) 996 return ChangeStatus::UNCHANGED; 997 CB.replaceAllUsesWith(&C); 998 return ChangeStatus::CHANGED; 999 }; 1000 1001 // If the assumed unique return value is an argument, annotate it. 1002 if (auto *UniqueRVArg = dyn_cast<Argument>(UniqueRV.getValue())) { 1003 getIRPosition() = IRPosition::argument(*UniqueRVArg); 1004 Changed = IRAttribute::manifest(A); 1005 } else if (auto *RVC = dyn_cast<Constant>(UniqueRV.getValue())) { 1006 // We can replace the returned value with the unique returned constant. 1007 Value &AnchorValue = getAnchorValue(); 1008 if (Function *F = dyn_cast<Function>(&AnchorValue)) { 1009 for (const Use &U : F->uses()) 1010 if (CallBase *CB = dyn_cast<CallBase>(U.getUser())) 1011 if (CB->isCallee(&U)) { 1012 Constant *RVCCast = 1013 ConstantExpr::getTruncOrBitCast(RVC, CB->getType()); 1014 Changed = ReplaceCallSiteUsersWith(*CB, *RVCCast) | Changed; 1015 } 1016 } else { 1017 assert(isa<CallBase>(AnchorValue) && 1018 "Expcected a function or call base anchor!"); 1019 Constant *RVCCast = 1020 ConstantExpr::getTruncOrBitCast(RVC, AnchorValue.getType()); 1021 Changed = ReplaceCallSiteUsersWith(cast<CallBase>(AnchorValue), *RVCCast); 1022 } 1023 if (Changed == ChangeStatus::CHANGED) 1024 STATS_DECLTRACK(UniqueConstantReturnValue, FunctionReturn, 1025 "Number of function returns replaced by constant return"); 1026 } 1027 1028 return Changed; 1029 } 1030 1031 const std::string AAReturnedValuesImpl::getAsStr() const { 1032 return (isAtFixpoint() ? "returns(#" : "may-return(#") + 1033 (isValidState() ? std::to_string(getNumReturnValues()) : "?") + 1034 ")[#UC: " + std::to_string(UnresolvedCalls.size()) + "]"; 1035 } 1036 1037 Optional<Value *> 1038 AAReturnedValuesImpl::getAssumedUniqueReturnValue(Attributor &A) const { 1039 // If checkForAllReturnedValues provides a unique value, ignoring potential 1040 // undef values that can also be present, it is assumed to be the actual 1041 // return value and forwarded to the caller of this method. If there are 1042 // multiple, a nullptr is returned indicating there cannot be a unique 1043 // returned value. 1044 Optional<Value *> UniqueRV; 1045 1046 auto Pred = [&](Value &RV) -> bool { 1047 // If we found a second returned value and neither the current nor the saved 1048 // one is an undef, there is no unique returned value. Undefs are special 1049 // since we can pretend they have any value. 1050 if (UniqueRV.hasValue() && UniqueRV != &RV && 1051 !(isa<UndefValue>(RV) || isa<UndefValue>(UniqueRV.getValue()))) { 1052 UniqueRV = nullptr; 1053 return false; 1054 } 1055 1056 // Do not overwrite a value with an undef. 1057 if (!UniqueRV.hasValue() || !isa<UndefValue>(RV)) 1058 UniqueRV = &RV; 1059 1060 return true; 1061 }; 1062 1063 if (!A.checkForAllReturnedValues(Pred, *this)) 1064 UniqueRV = nullptr; 1065 1066 return UniqueRV; 1067 } 1068 1069 bool AAReturnedValuesImpl::checkForAllReturnedValuesAndReturnInsts( 1070 const function_ref<bool(Value &, const SmallSetVector<ReturnInst *, 4> &)> 1071 &Pred) const { 1072 if (!isValidState()) 1073 return false; 1074 1075 // Check all returned values but ignore call sites as long as we have not 1076 // encountered an overdefined one during an update. 1077 for (auto &It : ReturnedValues) { 1078 Value *RV = It.first; 1079 1080 CallBase *CB = dyn_cast<CallBase>(RV); 1081 if (CB && !UnresolvedCalls.count(CB)) 1082 continue; 1083 1084 if (!Pred(*RV, It.second)) 1085 return false; 1086 } 1087 1088 return true; 1089 } 1090 1091 ChangeStatus AAReturnedValuesImpl::updateImpl(Attributor &A) { 1092 size_t NumUnresolvedCalls = UnresolvedCalls.size(); 1093 bool Changed = false; 1094 1095 // State used in the value traversals starting in returned values. 1096 struct RVState { 1097 // The map in which we collect return values -> return instrs. 1098 decltype(ReturnedValues) &RetValsMap; 1099 // The flag to indicate a change. 1100 bool &Changed; 1101 // The return instrs we come from. 1102 SmallSetVector<ReturnInst *, 4> RetInsts; 1103 }; 1104 1105 // Callback for a leaf value returned by the associated function. 1106 auto VisitValueCB = [](Value &Val, RVState &RVS, bool) -> bool { 1107 auto Size = RVS.RetValsMap[&Val].size(); 1108 RVS.RetValsMap[&Val].insert(RVS.RetInsts.begin(), RVS.RetInsts.end()); 1109 bool Inserted = RVS.RetValsMap[&Val].size() != Size; 1110 RVS.Changed |= Inserted; 1111 LLVM_DEBUG({ 1112 if (Inserted) 1113 dbgs() << "[AAReturnedValues] 1 Add new returned value " << Val 1114 << " => " << RVS.RetInsts.size() << "\n"; 1115 }); 1116 return true; 1117 }; 1118 1119 // Helper method to invoke the generic value traversal. 1120 auto VisitReturnedValue = [&](Value &RV, RVState &RVS) { 1121 IRPosition RetValPos = IRPosition::value(RV); 1122 return genericValueTraversal<AAReturnedValues, RVState>(A, RetValPos, *this, 1123 RVS, VisitValueCB); 1124 }; 1125 1126 // Callback for all "return intructions" live in the associated function. 1127 auto CheckReturnInst = [this, &VisitReturnedValue, &Changed](Instruction &I) { 1128 ReturnInst &Ret = cast<ReturnInst>(I); 1129 RVState RVS({ReturnedValues, Changed, {}}); 1130 RVS.RetInsts.insert(&Ret); 1131 return VisitReturnedValue(*Ret.getReturnValue(), RVS); 1132 }; 1133 1134 // Start by discovering returned values from all live returned instructions in 1135 // the associated function. 1136 if (!A.checkForAllInstructions(CheckReturnInst, *this, {Instruction::Ret})) 1137 return indicatePessimisticFixpoint(); 1138 1139 // Once returned values "directly" present in the code are handled we try to 1140 // resolve returned calls. 1141 decltype(ReturnedValues) NewRVsMap; 1142 for (auto &It : ReturnedValues) { 1143 LLVM_DEBUG(dbgs() << "[AAReturnedValues] Returned value: " << *It.first 1144 << " by #" << It.second.size() << " RIs\n"); 1145 CallBase *CB = dyn_cast<CallBase>(It.first); 1146 if (!CB || UnresolvedCalls.count(CB)) 1147 continue; 1148 1149 if (!CB->getCalledFunction()) { 1150 LLVM_DEBUG(dbgs() << "[AAReturnedValues] Unresolved call: " << *CB 1151 << "\n"); 1152 UnresolvedCalls.insert(CB); 1153 continue; 1154 } 1155 1156 // TODO: use the function scope once we have call site AAReturnedValues. 1157 const auto &RetValAA = A.getAAFor<AAReturnedValues>( 1158 *this, IRPosition::function(*CB->getCalledFunction())); 1159 LLVM_DEBUG(dbgs() << "[AAReturnedValues] Found another AAReturnedValues: " 1160 << static_cast<const AbstractAttribute &>(RetValAA) 1161 << "\n"); 1162 1163 // Skip dead ends, thus if we do not know anything about the returned 1164 // call we mark it as unresolved and it will stay that way. 1165 if (!RetValAA.getState().isValidState()) { 1166 LLVM_DEBUG(dbgs() << "[AAReturnedValues] Unresolved call: " << *CB 1167 << "\n"); 1168 UnresolvedCalls.insert(CB); 1169 continue; 1170 } 1171 1172 // Do not try to learn partial information. If the callee has unresolved 1173 // return values we will treat the call as unresolved/opaque. 1174 auto &RetValAAUnresolvedCalls = RetValAA.getUnresolvedCalls(); 1175 if (!RetValAAUnresolvedCalls.empty()) { 1176 UnresolvedCalls.insert(CB); 1177 continue; 1178 } 1179 1180 // Now check if we can track transitively returned values. If possible, thus 1181 // if all return value can be represented in the current scope, do so. 1182 bool Unresolved = false; 1183 for (auto &RetValAAIt : RetValAA.returned_values()) { 1184 Value *RetVal = RetValAAIt.first; 1185 if (isa<Argument>(RetVal) || isa<CallBase>(RetVal) || 1186 isa<Constant>(RetVal)) 1187 continue; 1188 // Anything that did not fit in the above categories cannot be resolved, 1189 // mark the call as unresolved. 1190 LLVM_DEBUG(dbgs() << "[AAReturnedValues] transitively returned value " 1191 "cannot be translated: " 1192 << *RetVal << "\n"); 1193 UnresolvedCalls.insert(CB); 1194 Unresolved = true; 1195 break; 1196 } 1197 1198 if (Unresolved) 1199 continue; 1200 1201 // Now track transitively returned values. 1202 unsigned &NumRetAA = NumReturnedValuesPerKnownAA[CB]; 1203 if (NumRetAA == RetValAA.getNumReturnValues()) { 1204 LLVM_DEBUG(dbgs() << "[AAReturnedValues] Skip call as it has not " 1205 "changed since it was seen last\n"); 1206 continue; 1207 } 1208 NumRetAA = RetValAA.getNumReturnValues(); 1209 1210 for (auto &RetValAAIt : RetValAA.returned_values()) { 1211 Value *RetVal = RetValAAIt.first; 1212 if (Argument *Arg = dyn_cast<Argument>(RetVal)) { 1213 // Arguments are mapped to call site operands and we begin the traversal 1214 // again. 1215 bool Unused = false; 1216 RVState RVS({NewRVsMap, Unused, RetValAAIt.second}); 1217 VisitReturnedValue(*CB->getArgOperand(Arg->getArgNo()), RVS); 1218 continue; 1219 } else if (isa<CallBase>(RetVal)) { 1220 // Call sites are resolved by the callee attribute over time, no need to 1221 // do anything for us. 1222 continue; 1223 } else if (isa<Constant>(RetVal)) { 1224 // Constants are valid everywhere, we can simply take them. 1225 NewRVsMap[RetVal].insert(It.second.begin(), It.second.end()); 1226 continue; 1227 } 1228 } 1229 } 1230 1231 // To avoid modifications to the ReturnedValues map while we iterate over it 1232 // we kept record of potential new entries in a copy map, NewRVsMap. 1233 for (auto &It : NewRVsMap) { 1234 assert(!It.second.empty() && "Entry does not add anything."); 1235 auto &ReturnInsts = ReturnedValues[It.first]; 1236 for (ReturnInst *RI : It.second) 1237 if (ReturnInsts.insert(RI)) { 1238 LLVM_DEBUG(dbgs() << "[AAReturnedValues] Add new returned value " 1239 << *It.first << " => " << *RI << "\n"); 1240 Changed = true; 1241 } 1242 } 1243 1244 Changed |= (NumUnresolvedCalls != UnresolvedCalls.size()); 1245 return Changed ? ChangeStatus::CHANGED : ChangeStatus::UNCHANGED; 1246 } 1247 1248 struct AAReturnedValuesFunction final : public AAReturnedValuesImpl { 1249 AAReturnedValuesFunction(const IRPosition &IRP) : AAReturnedValuesImpl(IRP) {} 1250 1251 /// See AbstractAttribute::trackStatistics() 1252 void trackStatistics() const override { STATS_DECLTRACK_ARG_ATTR(returned) } 1253 }; 1254 1255 /// Returned values information for a call sites. 1256 struct AAReturnedValuesCallSite final : AAReturnedValuesImpl { 1257 AAReturnedValuesCallSite(const IRPosition &IRP) : AAReturnedValuesImpl(IRP) {} 1258 1259 /// See AbstractAttribute::initialize(...). 1260 void initialize(Attributor &A) override { 1261 // TODO: Once we have call site specific value information we can provide 1262 // call site specific liveness information and then it makes 1263 // sense to specialize attributes for call sites instead of 1264 // redirecting requests to the callee. 1265 llvm_unreachable("Abstract attributes for returned values are not " 1266 "supported for call sites yet!"); 1267 } 1268 1269 /// See AbstractAttribute::updateImpl(...). 1270 ChangeStatus updateImpl(Attributor &A) override { 1271 return indicatePessimisticFixpoint(); 1272 } 1273 1274 /// See AbstractAttribute::trackStatistics() 1275 void trackStatistics() const override {} 1276 }; 1277 1278 /// ------------------------ NoSync Function Attribute ------------------------- 1279 1280 struct AANoSyncImpl : AANoSync { 1281 AANoSyncImpl(const IRPosition &IRP) : AANoSync(IRP) {} 1282 1283 const std::string getAsStr() const override { 1284 return getAssumed() ? "nosync" : "may-sync"; 1285 } 1286 1287 /// See AbstractAttribute::updateImpl(...). 1288 ChangeStatus updateImpl(Attributor &A) override; 1289 1290 /// Helper function used to determine whether an instruction is non-relaxed 1291 /// atomic. In other words, if an atomic instruction does not have unordered 1292 /// or monotonic ordering 1293 static bool isNonRelaxedAtomic(Instruction *I); 1294 1295 /// Helper function used to determine whether an instruction is volatile. 1296 static bool isVolatile(Instruction *I); 1297 1298 /// Helper function uset to check if intrinsic is volatile (memcpy, memmove, 1299 /// memset). 1300 static bool isNoSyncIntrinsic(Instruction *I); 1301 }; 1302 1303 bool AANoSyncImpl::isNonRelaxedAtomic(Instruction *I) { 1304 if (!I->isAtomic()) 1305 return false; 1306 1307 AtomicOrdering Ordering; 1308 switch (I->getOpcode()) { 1309 case Instruction::AtomicRMW: 1310 Ordering = cast<AtomicRMWInst>(I)->getOrdering(); 1311 break; 1312 case Instruction::Store: 1313 Ordering = cast<StoreInst>(I)->getOrdering(); 1314 break; 1315 case Instruction::Load: 1316 Ordering = cast<LoadInst>(I)->getOrdering(); 1317 break; 1318 case Instruction::Fence: { 1319 auto *FI = cast<FenceInst>(I); 1320 if (FI->getSyncScopeID() == SyncScope::SingleThread) 1321 return false; 1322 Ordering = FI->getOrdering(); 1323 break; 1324 } 1325 case Instruction::AtomicCmpXchg: { 1326 AtomicOrdering Success = cast<AtomicCmpXchgInst>(I)->getSuccessOrdering(); 1327 AtomicOrdering Failure = cast<AtomicCmpXchgInst>(I)->getFailureOrdering(); 1328 // Only if both are relaxed, than it can be treated as relaxed. 1329 // Otherwise it is non-relaxed. 1330 if (Success != AtomicOrdering::Unordered && 1331 Success != AtomicOrdering::Monotonic) 1332 return true; 1333 if (Failure != AtomicOrdering::Unordered && 1334 Failure != AtomicOrdering::Monotonic) 1335 return true; 1336 return false; 1337 } 1338 default: 1339 llvm_unreachable( 1340 "New atomic operations need to be known in the attributor."); 1341 } 1342 1343 // Relaxed. 1344 if (Ordering == AtomicOrdering::Unordered || 1345 Ordering == AtomicOrdering::Monotonic) 1346 return false; 1347 return true; 1348 } 1349 1350 /// Checks if an intrinsic is nosync. Currently only checks mem* intrinsics. 1351 /// FIXME: We should ipmrove the handling of intrinsics. 1352 bool AANoSyncImpl::isNoSyncIntrinsic(Instruction *I) { 1353 if (auto *II = dyn_cast<IntrinsicInst>(I)) { 1354 switch (II->getIntrinsicID()) { 1355 /// Element wise atomic memory intrinsics are can only be unordered, 1356 /// therefore nosync. 1357 case Intrinsic::memset_element_unordered_atomic: 1358 case Intrinsic::memmove_element_unordered_atomic: 1359 case Intrinsic::memcpy_element_unordered_atomic: 1360 return true; 1361 case Intrinsic::memset: 1362 case Intrinsic::memmove: 1363 case Intrinsic::memcpy: 1364 if (!cast<MemIntrinsic>(II)->isVolatile()) 1365 return true; 1366 return false; 1367 default: 1368 return false; 1369 } 1370 } 1371 return false; 1372 } 1373 1374 bool AANoSyncImpl::isVolatile(Instruction *I) { 1375 assert(!ImmutableCallSite(I) && !isa<CallBase>(I) && 1376 "Calls should not be checked here"); 1377 1378 switch (I->getOpcode()) { 1379 case Instruction::AtomicRMW: 1380 return cast<AtomicRMWInst>(I)->isVolatile(); 1381 case Instruction::Store: 1382 return cast<StoreInst>(I)->isVolatile(); 1383 case Instruction::Load: 1384 return cast<LoadInst>(I)->isVolatile(); 1385 case Instruction::AtomicCmpXchg: 1386 return cast<AtomicCmpXchgInst>(I)->isVolatile(); 1387 default: 1388 return false; 1389 } 1390 } 1391 1392 ChangeStatus AANoSyncImpl::updateImpl(Attributor &A) { 1393 1394 auto CheckRWInstForNoSync = [&](Instruction &I) { 1395 /// We are looking for volatile instructions or Non-Relaxed atomics. 1396 /// FIXME: We should ipmrove the handling of intrinsics. 1397 1398 if (isa<IntrinsicInst>(&I) && isNoSyncIntrinsic(&I)) 1399 return true; 1400 1401 if (ImmutableCallSite ICS = ImmutableCallSite(&I)) { 1402 if (ICS.hasFnAttr(Attribute::NoSync)) 1403 return true; 1404 1405 const auto &NoSyncAA = 1406 A.getAAFor<AANoSync>(*this, IRPosition::callsite_function(ICS)); 1407 if (NoSyncAA.isAssumedNoSync()) 1408 return true; 1409 return false; 1410 } 1411 1412 if (!isVolatile(&I) && !isNonRelaxedAtomic(&I)) 1413 return true; 1414 1415 return false; 1416 }; 1417 1418 auto CheckForNoSync = [&](Instruction &I) { 1419 // At this point we handled all read/write effects and they are all 1420 // nosync, so they can be skipped. 1421 if (I.mayReadOrWriteMemory()) 1422 return true; 1423 1424 // non-convergent and readnone imply nosync. 1425 return !ImmutableCallSite(&I).isConvergent(); 1426 }; 1427 1428 if (!A.checkForAllReadWriteInstructions(CheckRWInstForNoSync, *this) || 1429 !A.checkForAllCallLikeInstructions(CheckForNoSync, *this)) 1430 return indicatePessimisticFixpoint(); 1431 1432 return ChangeStatus::UNCHANGED; 1433 } 1434 1435 struct AANoSyncFunction final : public AANoSyncImpl { 1436 AANoSyncFunction(const IRPosition &IRP) : AANoSyncImpl(IRP) {} 1437 1438 /// See AbstractAttribute::trackStatistics() 1439 void trackStatistics() const override { STATS_DECLTRACK_FN_ATTR(nosync) } 1440 }; 1441 1442 /// NoSync attribute deduction for a call sites. 1443 struct AANoSyncCallSite final : AANoSyncImpl { 1444 AANoSyncCallSite(const IRPosition &IRP) : AANoSyncImpl(IRP) {} 1445 1446 /// See AbstractAttribute::initialize(...). 1447 void initialize(Attributor &A) override { 1448 AANoSyncImpl::initialize(A); 1449 Function *F = getAssociatedFunction(); 1450 if (!F) 1451 indicatePessimisticFixpoint(); 1452 } 1453 1454 /// See AbstractAttribute::updateImpl(...). 1455 ChangeStatus updateImpl(Attributor &A) override { 1456 // TODO: Once we have call site specific value information we can provide 1457 // call site specific liveness information and then it makes 1458 // sense to specialize attributes for call sites arguments instead of 1459 // redirecting requests to the callee argument. 1460 Function *F = getAssociatedFunction(); 1461 const IRPosition &FnPos = IRPosition::function(*F); 1462 auto &FnAA = A.getAAFor<AANoSync>(*this, FnPos); 1463 return clampStateAndIndicateChange( 1464 getState(), static_cast<const AANoSync::StateType &>(FnAA.getState())); 1465 } 1466 1467 /// See AbstractAttribute::trackStatistics() 1468 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(nosync); } 1469 }; 1470 1471 /// ------------------------ No-Free Attributes ---------------------------- 1472 1473 struct AANoFreeImpl : public AANoFree { 1474 AANoFreeImpl(const IRPosition &IRP) : AANoFree(IRP) {} 1475 1476 /// See AbstractAttribute::updateImpl(...). 1477 ChangeStatus updateImpl(Attributor &A) override { 1478 auto CheckForNoFree = [&](Instruction &I) { 1479 ImmutableCallSite ICS(&I); 1480 if (ICS.hasFnAttr(Attribute::NoFree)) 1481 return true; 1482 1483 const auto &NoFreeAA = 1484 A.getAAFor<AANoFree>(*this, IRPosition::callsite_function(ICS)); 1485 return NoFreeAA.isAssumedNoFree(); 1486 }; 1487 1488 if (!A.checkForAllCallLikeInstructions(CheckForNoFree, *this)) 1489 return indicatePessimisticFixpoint(); 1490 return ChangeStatus::UNCHANGED; 1491 } 1492 1493 /// See AbstractAttribute::getAsStr(). 1494 const std::string getAsStr() const override { 1495 return getAssumed() ? "nofree" : "may-free"; 1496 } 1497 }; 1498 1499 struct AANoFreeFunction final : public AANoFreeImpl { 1500 AANoFreeFunction(const IRPosition &IRP) : AANoFreeImpl(IRP) {} 1501 1502 /// See AbstractAttribute::trackStatistics() 1503 void trackStatistics() const override { STATS_DECLTRACK_FN_ATTR(nofree) } 1504 }; 1505 1506 /// NoFree attribute deduction for a call sites. 1507 struct AANoFreeCallSite final : AANoFreeImpl { 1508 AANoFreeCallSite(const IRPosition &IRP) : AANoFreeImpl(IRP) {} 1509 1510 /// See AbstractAttribute::initialize(...). 1511 void initialize(Attributor &A) override { 1512 AANoFreeImpl::initialize(A); 1513 Function *F = getAssociatedFunction(); 1514 if (!F) 1515 indicatePessimisticFixpoint(); 1516 } 1517 1518 /// See AbstractAttribute::updateImpl(...). 1519 ChangeStatus updateImpl(Attributor &A) override { 1520 // TODO: Once we have call site specific value information we can provide 1521 // call site specific liveness information and then it makes 1522 // sense to specialize attributes for call sites arguments instead of 1523 // redirecting requests to the callee argument. 1524 Function *F = getAssociatedFunction(); 1525 const IRPosition &FnPos = IRPosition::function(*F); 1526 auto &FnAA = A.getAAFor<AANoFree>(*this, FnPos); 1527 return clampStateAndIndicateChange( 1528 getState(), static_cast<const AANoFree::StateType &>(FnAA.getState())); 1529 } 1530 1531 /// See AbstractAttribute::trackStatistics() 1532 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(nofree); } 1533 }; 1534 1535 /// ------------------------ NonNull Argument Attribute ------------------------ 1536 static int64_t getKnownNonNullAndDerefBytesForUse( 1537 Attributor &A, AbstractAttribute &QueryingAA, Value &AssociatedValue, 1538 const Use *U, const Instruction *I, bool &IsNonNull, bool &TrackUse) { 1539 TrackUse = false; 1540 1541 const Value *UseV = U->get(); 1542 if (!UseV->getType()->isPointerTy()) 1543 return 0; 1544 1545 Type *PtrTy = UseV->getType(); 1546 const Function *F = I->getFunction(); 1547 bool NullPointerIsDefined = 1548 F ? llvm::NullPointerIsDefined(F, PtrTy->getPointerAddressSpace()) : true; 1549 const DataLayout &DL = A.getInfoCache().getDL(); 1550 if (ImmutableCallSite ICS = ImmutableCallSite(I)) { 1551 if (ICS.isBundleOperand(U)) 1552 return 0; 1553 1554 if (ICS.isCallee(U)) { 1555 IsNonNull |= !NullPointerIsDefined; 1556 return 0; 1557 } 1558 1559 unsigned ArgNo = ICS.getArgumentNo(U); 1560 IRPosition IRP = IRPosition::callsite_argument(ICS, ArgNo); 1561 auto &DerefAA = A.getAAFor<AADereferenceable>(QueryingAA, IRP); 1562 IsNonNull |= DerefAA.isKnownNonNull(); 1563 return DerefAA.getKnownDereferenceableBytes(); 1564 } 1565 1566 int64_t Offset; 1567 if (const Value *Base = getBasePointerOfAccessPointerOperand(I, Offset, DL)) { 1568 if (Base == &AssociatedValue && getPointerOperand(I) == UseV) { 1569 int64_t DerefBytes = 1570 Offset + (int64_t)DL.getTypeStoreSize(PtrTy->getPointerElementType()); 1571 1572 IsNonNull |= !NullPointerIsDefined; 1573 return DerefBytes; 1574 } 1575 } 1576 if (const Value *Base = 1577 GetPointerBaseWithConstantOffset(UseV, Offset, DL, 1578 /*AllowNonInbounds*/ false)) { 1579 auto &DerefAA = 1580 A.getAAFor<AADereferenceable>(QueryingAA, IRPosition::value(*Base)); 1581 IsNonNull |= (!NullPointerIsDefined && DerefAA.isKnownNonNull()); 1582 IsNonNull |= (!NullPointerIsDefined && (Offset != 0)); 1583 int64_t DerefBytes = DerefAA.getKnownDereferenceableBytes(); 1584 return std::max(int64_t(0), DerefBytes - Offset); 1585 } 1586 1587 return 0; 1588 } 1589 1590 struct AANonNullImpl : AANonNull { 1591 AANonNullImpl(const IRPosition &IRP) 1592 : AANonNull(IRP), 1593 NullIsDefined(NullPointerIsDefined( 1594 getAnchorScope(), 1595 getAssociatedValue().getType()->getPointerAddressSpace())) {} 1596 1597 /// See AbstractAttribute::initialize(...). 1598 void initialize(Attributor &A) override { 1599 if (!NullIsDefined && 1600 hasAttr({Attribute::NonNull, Attribute::Dereferenceable})) 1601 indicateOptimisticFixpoint(); 1602 else 1603 AANonNull::initialize(A); 1604 } 1605 1606 /// See AAFromMustBeExecutedContext 1607 bool followUse(Attributor &A, const Use *U, const Instruction *I) { 1608 bool IsNonNull = false; 1609 bool TrackUse = false; 1610 getKnownNonNullAndDerefBytesForUse(A, *this, getAssociatedValue(), U, I, 1611 IsNonNull, TrackUse); 1612 takeKnownMaximum(IsNonNull); 1613 return TrackUse; 1614 } 1615 1616 /// See AbstractAttribute::getAsStr(). 1617 const std::string getAsStr() const override { 1618 return getAssumed() ? "nonnull" : "may-null"; 1619 } 1620 1621 /// Flag to determine if the underlying value can be null and still allow 1622 /// valid accesses. 1623 const bool NullIsDefined; 1624 }; 1625 1626 /// NonNull attribute for a floating value. 1627 struct AANonNullFloating 1628 : AAFromMustBeExecutedContext<AANonNull, AANonNullImpl> { 1629 using Base = AAFromMustBeExecutedContext<AANonNull, AANonNullImpl>; 1630 AANonNullFloating(const IRPosition &IRP) : Base(IRP) {} 1631 1632 /// See AbstractAttribute::initialize(...). 1633 void initialize(Attributor &A) override { 1634 Base::initialize(A); 1635 1636 if (isAtFixpoint()) 1637 return; 1638 1639 const IRPosition &IRP = getIRPosition(); 1640 const Value &V = IRP.getAssociatedValue(); 1641 const DataLayout &DL = A.getDataLayout(); 1642 1643 // TODO: This context sensitive query should be removed once we can do 1644 // context sensitive queries in the genericValueTraversal below. 1645 if (isKnownNonZero(&V, DL, 0, /* TODO: AC */ nullptr, IRP.getCtxI(), 1646 /* TODO: DT */ nullptr)) 1647 indicateOptimisticFixpoint(); 1648 } 1649 1650 /// See AbstractAttribute::updateImpl(...). 1651 ChangeStatus updateImpl(Attributor &A) override { 1652 ChangeStatus Change = Base::updateImpl(A); 1653 if (isKnownNonNull()) 1654 return Change; 1655 1656 if (!NullIsDefined) { 1657 const auto &DerefAA = A.getAAFor<AADereferenceable>(*this, getIRPosition()); 1658 if (DerefAA.getAssumedDereferenceableBytes()) 1659 return Change; 1660 } 1661 1662 const DataLayout &DL = A.getDataLayout(); 1663 1664 auto VisitValueCB = [&](Value &V, AAAlign::StateType &T, 1665 bool Stripped) -> bool { 1666 const auto &AA = A.getAAFor<AANonNull>(*this, IRPosition::value(V)); 1667 if (!Stripped && this == &AA) { 1668 if (!isKnownNonZero(&V, DL, 0, /* TODO: AC */ nullptr, 1669 /* CtxI */ getCtxI(), 1670 /* TODO: DT */ nullptr)) 1671 T.indicatePessimisticFixpoint(); 1672 } else { 1673 // Use abstract attribute information. 1674 const AANonNull::StateType &NS = 1675 static_cast<const AANonNull::StateType &>(AA.getState()); 1676 T ^= NS; 1677 } 1678 return T.isValidState(); 1679 }; 1680 1681 StateType T; 1682 if (!genericValueTraversal<AANonNull, StateType>(A, getIRPosition(), *this, 1683 T, VisitValueCB)) 1684 return indicatePessimisticFixpoint(); 1685 1686 return clampStateAndIndicateChange(getState(), T); 1687 } 1688 1689 /// See AbstractAttribute::trackStatistics() 1690 void trackStatistics() const override { STATS_DECLTRACK_FNRET_ATTR(nonnull) } 1691 }; 1692 1693 /// NonNull attribute for function return value. 1694 struct AANonNullReturned final 1695 : AAReturnedFromReturnedValues<AANonNull, AANonNullImpl> { 1696 AANonNullReturned(const IRPosition &IRP) 1697 : AAReturnedFromReturnedValues<AANonNull, AANonNullImpl>(IRP) {} 1698 1699 /// See AbstractAttribute::trackStatistics() 1700 void trackStatistics() const override { STATS_DECLTRACK_FNRET_ATTR(nonnull) } 1701 }; 1702 1703 /// NonNull attribute for function argument. 1704 struct AANonNullArgument final 1705 : AAArgumentFromCallSiteArgumentsAndMustBeExecutedContext<AANonNull, 1706 AANonNullImpl> { 1707 AANonNullArgument(const IRPosition &IRP) 1708 : AAArgumentFromCallSiteArgumentsAndMustBeExecutedContext<AANonNull, 1709 AANonNullImpl>( 1710 IRP) {} 1711 1712 /// See AbstractAttribute::trackStatistics() 1713 void trackStatistics() const override { STATS_DECLTRACK_ARG_ATTR(nonnull) } 1714 }; 1715 1716 struct AANonNullCallSiteArgument final : AANonNullFloating { 1717 AANonNullCallSiteArgument(const IRPosition &IRP) : AANonNullFloating(IRP) {} 1718 1719 /// See AbstractAttribute::trackStatistics() 1720 void trackStatistics() const override { STATS_DECLTRACK_CSARG_ATTR(nonnull) } 1721 }; 1722 1723 /// NonNull attribute for a call site return position. 1724 struct AANonNullCallSiteReturned final 1725 : AACallSiteReturnedFromReturnedAndMustBeExecutedContext<AANonNull, 1726 AANonNullImpl> { 1727 AANonNullCallSiteReturned(const IRPosition &IRP) 1728 : AACallSiteReturnedFromReturnedAndMustBeExecutedContext<AANonNull, 1729 AANonNullImpl>( 1730 IRP) {} 1731 1732 /// See AbstractAttribute::trackStatistics() 1733 void trackStatistics() const override { STATS_DECLTRACK_CSRET_ATTR(nonnull) } 1734 }; 1735 1736 /// ------------------------ No-Recurse Attributes ---------------------------- 1737 1738 struct AANoRecurseImpl : public AANoRecurse { 1739 AANoRecurseImpl(const IRPosition &IRP) : AANoRecurse(IRP) {} 1740 1741 /// See AbstractAttribute::getAsStr() 1742 const std::string getAsStr() const override { 1743 return getAssumed() ? "norecurse" : "may-recurse"; 1744 } 1745 }; 1746 1747 struct AANoRecurseFunction final : AANoRecurseImpl { 1748 AANoRecurseFunction(const IRPosition &IRP) : AANoRecurseImpl(IRP) {} 1749 1750 /// See AbstractAttribute::initialize(...). 1751 void initialize(Attributor &A) override { 1752 AANoRecurseImpl::initialize(A); 1753 if (const Function *F = getAnchorScope()) 1754 if (A.getInfoCache().getSccSize(*F) == 1) 1755 return; 1756 indicatePessimisticFixpoint(); 1757 } 1758 1759 /// See AbstractAttribute::updateImpl(...). 1760 ChangeStatus updateImpl(Attributor &A) override { 1761 1762 auto CheckForNoRecurse = [&](Instruction &I) { 1763 ImmutableCallSite ICS(&I); 1764 if (ICS.hasFnAttr(Attribute::NoRecurse)) 1765 return true; 1766 1767 const auto &NoRecurseAA = 1768 A.getAAFor<AANoRecurse>(*this, IRPosition::callsite_function(ICS)); 1769 if (!NoRecurseAA.isAssumedNoRecurse()) 1770 return false; 1771 1772 // Recursion to the same function 1773 if (ICS.getCalledFunction() == getAnchorScope()) 1774 return false; 1775 1776 return true; 1777 }; 1778 1779 if (!A.checkForAllCallLikeInstructions(CheckForNoRecurse, *this)) 1780 return indicatePessimisticFixpoint(); 1781 return ChangeStatus::UNCHANGED; 1782 } 1783 1784 void trackStatistics() const override { STATS_DECLTRACK_FN_ATTR(norecurse) } 1785 }; 1786 1787 /// NoRecurse attribute deduction for a call sites. 1788 struct AANoRecurseCallSite final : AANoRecurseImpl { 1789 AANoRecurseCallSite(const IRPosition &IRP) : AANoRecurseImpl(IRP) {} 1790 1791 /// See AbstractAttribute::initialize(...). 1792 void initialize(Attributor &A) override { 1793 AANoRecurseImpl::initialize(A); 1794 Function *F = getAssociatedFunction(); 1795 if (!F) 1796 indicatePessimisticFixpoint(); 1797 } 1798 1799 /// See AbstractAttribute::updateImpl(...). 1800 ChangeStatus updateImpl(Attributor &A) override { 1801 // TODO: Once we have call site specific value information we can provide 1802 // call site specific liveness information and then it makes 1803 // sense to specialize attributes for call sites arguments instead of 1804 // redirecting requests to the callee argument. 1805 Function *F = getAssociatedFunction(); 1806 const IRPosition &FnPos = IRPosition::function(*F); 1807 auto &FnAA = A.getAAFor<AANoRecurse>(*this, FnPos); 1808 return clampStateAndIndicateChange( 1809 getState(), 1810 static_cast<const AANoRecurse::StateType &>(FnAA.getState())); 1811 } 1812 1813 /// See AbstractAttribute::trackStatistics() 1814 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(norecurse); } 1815 }; 1816 1817 /// ------------------------ Will-Return Attributes ---------------------------- 1818 1819 // Helper function that checks whether a function has any cycle. 1820 // TODO: Replace with more efficent code 1821 static bool containsCycle(Function &F) { 1822 SmallPtrSet<BasicBlock *, 32> Visited; 1823 1824 // Traverse BB by dfs and check whether successor is already visited. 1825 for (BasicBlock *BB : depth_first(&F)) { 1826 Visited.insert(BB); 1827 for (auto *SuccBB : successors(BB)) { 1828 if (Visited.count(SuccBB)) 1829 return true; 1830 } 1831 } 1832 return false; 1833 } 1834 1835 // Helper function that checks the function have a loop which might become an 1836 // endless loop 1837 // FIXME: Any cycle is regarded as endless loop for now. 1838 // We have to allow some patterns. 1839 static bool containsPossiblyEndlessLoop(Function *F) { 1840 return !F || !F->hasExactDefinition() || containsCycle(*F); 1841 } 1842 1843 struct AAWillReturnImpl : public AAWillReturn { 1844 AAWillReturnImpl(const IRPosition &IRP) : AAWillReturn(IRP) {} 1845 1846 /// See AbstractAttribute::initialize(...). 1847 void initialize(Attributor &A) override { 1848 AAWillReturn::initialize(A); 1849 1850 Function *F = getAssociatedFunction(); 1851 if (containsPossiblyEndlessLoop(F)) 1852 indicatePessimisticFixpoint(); 1853 } 1854 1855 /// See AbstractAttribute::updateImpl(...). 1856 ChangeStatus updateImpl(Attributor &A) override { 1857 auto CheckForWillReturn = [&](Instruction &I) { 1858 IRPosition IPos = IRPosition::callsite_function(ImmutableCallSite(&I)); 1859 const auto &WillReturnAA = A.getAAFor<AAWillReturn>(*this, IPos); 1860 if (WillReturnAA.isKnownWillReturn()) 1861 return true; 1862 if (!WillReturnAA.isAssumedWillReturn()) 1863 return false; 1864 const auto &NoRecurseAA = A.getAAFor<AANoRecurse>(*this, IPos); 1865 return NoRecurseAA.isAssumedNoRecurse(); 1866 }; 1867 1868 if (!A.checkForAllCallLikeInstructions(CheckForWillReturn, *this)) 1869 return indicatePessimisticFixpoint(); 1870 1871 return ChangeStatus::UNCHANGED; 1872 } 1873 1874 /// See AbstractAttribute::getAsStr() 1875 const std::string getAsStr() const override { 1876 return getAssumed() ? "willreturn" : "may-noreturn"; 1877 } 1878 }; 1879 1880 struct AAWillReturnFunction final : AAWillReturnImpl { 1881 AAWillReturnFunction(const IRPosition &IRP) : AAWillReturnImpl(IRP) {} 1882 1883 /// See AbstractAttribute::trackStatistics() 1884 void trackStatistics() const override { STATS_DECLTRACK_FN_ATTR(willreturn) } 1885 }; 1886 1887 /// WillReturn attribute deduction for a call sites. 1888 struct AAWillReturnCallSite final : AAWillReturnImpl { 1889 AAWillReturnCallSite(const IRPosition &IRP) : AAWillReturnImpl(IRP) {} 1890 1891 /// See AbstractAttribute::initialize(...). 1892 void initialize(Attributor &A) override { 1893 AAWillReturnImpl::initialize(A); 1894 Function *F = getAssociatedFunction(); 1895 if (!F) 1896 indicatePessimisticFixpoint(); 1897 } 1898 1899 /// See AbstractAttribute::updateImpl(...). 1900 ChangeStatus updateImpl(Attributor &A) override { 1901 // TODO: Once we have call site specific value information we can provide 1902 // call site specific liveness information and then it makes 1903 // sense to specialize attributes for call sites arguments instead of 1904 // redirecting requests to the callee argument. 1905 Function *F = getAssociatedFunction(); 1906 const IRPosition &FnPos = IRPosition::function(*F); 1907 auto &FnAA = A.getAAFor<AAWillReturn>(*this, FnPos); 1908 return clampStateAndIndicateChange( 1909 getState(), 1910 static_cast<const AAWillReturn::StateType &>(FnAA.getState())); 1911 } 1912 1913 /// See AbstractAttribute::trackStatistics() 1914 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(willreturn); } 1915 }; 1916 1917 /// ------------------------ NoAlias Argument Attribute ------------------------ 1918 1919 struct AANoAliasImpl : AANoAlias { 1920 AANoAliasImpl(const IRPosition &IRP) : AANoAlias(IRP) {} 1921 1922 const std::string getAsStr() const override { 1923 return getAssumed() ? "noalias" : "may-alias"; 1924 } 1925 }; 1926 1927 /// NoAlias attribute for a floating value. 1928 struct AANoAliasFloating final : AANoAliasImpl { 1929 AANoAliasFloating(const IRPosition &IRP) : AANoAliasImpl(IRP) {} 1930 1931 /// See AbstractAttribute::initialize(...). 1932 void initialize(Attributor &A) override { 1933 AANoAliasImpl::initialize(A); 1934 Value &Val = getAssociatedValue(); 1935 if (isa<AllocaInst>(Val)) 1936 indicateOptimisticFixpoint(); 1937 if (isa<ConstantPointerNull>(Val) && 1938 Val.getType()->getPointerAddressSpace() == 0) 1939 indicateOptimisticFixpoint(); 1940 } 1941 1942 /// See AbstractAttribute::updateImpl(...). 1943 ChangeStatus updateImpl(Attributor &A) override { 1944 // TODO: Implement this. 1945 return indicatePessimisticFixpoint(); 1946 } 1947 1948 /// See AbstractAttribute::trackStatistics() 1949 void trackStatistics() const override { 1950 STATS_DECLTRACK_FLOATING_ATTR(noalias) 1951 } 1952 }; 1953 1954 /// NoAlias attribute for an argument. 1955 struct AANoAliasArgument final 1956 : AAArgumentFromCallSiteArguments<AANoAlias, AANoAliasImpl> { 1957 AANoAliasArgument(const IRPosition &IRP) 1958 : AAArgumentFromCallSiteArguments<AANoAlias, AANoAliasImpl>(IRP) {} 1959 1960 /// See AbstractAttribute::trackStatistics() 1961 void trackStatistics() const override { STATS_DECLTRACK_ARG_ATTR(noalias) } 1962 }; 1963 1964 struct AANoAliasCallSiteArgument final : AANoAliasImpl { 1965 AANoAliasCallSiteArgument(const IRPosition &IRP) : AANoAliasImpl(IRP) {} 1966 1967 /// See AbstractAttribute::initialize(...). 1968 void initialize(Attributor &A) override { 1969 // See callsite argument attribute and callee argument attribute. 1970 ImmutableCallSite ICS(&getAnchorValue()); 1971 if (ICS.paramHasAttr(getArgNo(), Attribute::NoAlias)) 1972 indicateOptimisticFixpoint(); 1973 } 1974 1975 /// See AbstractAttribute::updateImpl(...). 1976 ChangeStatus updateImpl(Attributor &A) override { 1977 // We can deduce "noalias" if the following conditions hold. 1978 // (i) Associated value is assumed to be noalias in the definition. 1979 // (ii) Associated value is assumed to be no-capture in all the uses 1980 // possibly executed before this callsite. 1981 // (iii) There is no other pointer argument which could alias with the 1982 // value. 1983 1984 const Value &V = getAssociatedValue(); 1985 const IRPosition IRP = IRPosition::value(V); 1986 1987 // (i) Check whether noalias holds in the definition. 1988 1989 auto &NoAliasAA = A.getAAFor<AANoAlias>(*this, IRP); 1990 1991 if (!NoAliasAA.isAssumedNoAlias()) 1992 return indicatePessimisticFixpoint(); 1993 1994 LLVM_DEBUG(dbgs() << "[Attributor][AANoAliasCSArg] " << V 1995 << " is assumed NoAlias in the definition\n"); 1996 1997 // (ii) Check whether the value is captured in the scope using AANoCapture. 1998 // FIXME: This is conservative though, it is better to look at CFG and 1999 // check only uses possibly executed before this callsite. 2000 2001 auto &NoCaptureAA = A.getAAFor<AANoCapture>(*this, IRP); 2002 if (!NoCaptureAA.isAssumedNoCaptureMaybeReturned()) { 2003 LLVM_DEBUG( 2004 dbgs() << "[Attributor][AANoAliasCSArg] " << V 2005 << " cannot be noalias as it is potentially captured\n"); 2006 return indicatePessimisticFixpoint(); 2007 } 2008 2009 // (iii) Check there is no other pointer argument which could alias with the 2010 // value. 2011 ImmutableCallSite ICS(&getAnchorValue()); 2012 for (unsigned i = 0; i < ICS.getNumArgOperands(); i++) { 2013 if (getArgNo() == (int)i) 2014 continue; 2015 const Value *ArgOp = ICS.getArgOperand(i); 2016 if (!ArgOp->getType()->isPointerTy()) 2017 continue; 2018 2019 if (const Function *F = getAnchorScope()) { 2020 if (AAResults *AAR = A.getInfoCache().getAAResultsForFunction(*F)) { 2021 bool IsAliasing = AAR->isNoAlias(&getAssociatedValue(), ArgOp); 2022 LLVM_DEBUG(dbgs() 2023 << "[Attributor][NoAliasCSArg] Check alias between " 2024 "callsite arguments " 2025 << AAR->isNoAlias(&getAssociatedValue(), ArgOp) << " " 2026 << getAssociatedValue() << " " << *ArgOp << " => " 2027 << (IsAliasing ? "" : "no-") << "alias \n"); 2028 2029 if (IsAliasing) 2030 continue; 2031 } 2032 } 2033 return indicatePessimisticFixpoint(); 2034 } 2035 2036 return ChangeStatus::UNCHANGED; 2037 } 2038 2039 /// See AbstractAttribute::trackStatistics() 2040 void trackStatistics() const override { STATS_DECLTRACK_CSARG_ATTR(noalias) } 2041 }; 2042 2043 /// NoAlias attribute for function return value. 2044 struct AANoAliasReturned final : AANoAliasImpl { 2045 AANoAliasReturned(const IRPosition &IRP) : AANoAliasImpl(IRP) {} 2046 2047 /// See AbstractAttribute::updateImpl(...). 2048 virtual ChangeStatus updateImpl(Attributor &A) override { 2049 2050 auto CheckReturnValue = [&](Value &RV) -> bool { 2051 if (Constant *C = dyn_cast<Constant>(&RV)) 2052 if (C->isNullValue() || isa<UndefValue>(C)) 2053 return true; 2054 2055 /// For now, we can only deduce noalias if we have call sites. 2056 /// FIXME: add more support. 2057 ImmutableCallSite ICS(&RV); 2058 if (!ICS) 2059 return false; 2060 2061 const IRPosition &RVPos = IRPosition::value(RV); 2062 const auto &NoAliasAA = A.getAAFor<AANoAlias>(*this, RVPos); 2063 if (!NoAliasAA.isAssumedNoAlias()) 2064 return false; 2065 2066 const auto &NoCaptureAA = A.getAAFor<AANoCapture>(*this, RVPos); 2067 return NoCaptureAA.isAssumedNoCaptureMaybeReturned(); 2068 }; 2069 2070 if (!A.checkForAllReturnedValues(CheckReturnValue, *this)) 2071 return indicatePessimisticFixpoint(); 2072 2073 return ChangeStatus::UNCHANGED; 2074 } 2075 2076 /// See AbstractAttribute::trackStatistics() 2077 void trackStatistics() const override { STATS_DECLTRACK_FNRET_ATTR(noalias) } 2078 }; 2079 2080 /// NoAlias attribute deduction for a call site return value. 2081 struct AANoAliasCallSiteReturned final : AANoAliasImpl { 2082 AANoAliasCallSiteReturned(const IRPosition &IRP) : AANoAliasImpl(IRP) {} 2083 2084 /// See AbstractAttribute::initialize(...). 2085 void initialize(Attributor &A) override { 2086 AANoAliasImpl::initialize(A); 2087 Function *F = getAssociatedFunction(); 2088 if (!F) 2089 indicatePessimisticFixpoint(); 2090 } 2091 2092 /// See AbstractAttribute::updateImpl(...). 2093 ChangeStatus updateImpl(Attributor &A) override { 2094 // TODO: Once we have call site specific value information we can provide 2095 // call site specific liveness information and then it makes 2096 // sense to specialize attributes for call sites arguments instead of 2097 // redirecting requests to the callee argument. 2098 Function *F = getAssociatedFunction(); 2099 const IRPosition &FnPos = IRPosition::returned(*F); 2100 auto &FnAA = A.getAAFor<AANoAlias>(*this, FnPos); 2101 return clampStateAndIndicateChange( 2102 getState(), static_cast<const AANoAlias::StateType &>(FnAA.getState())); 2103 } 2104 2105 /// See AbstractAttribute::trackStatistics() 2106 void trackStatistics() const override { STATS_DECLTRACK_CSRET_ATTR(noalias); } 2107 }; 2108 2109 /// -------------------AAIsDead Function Attribute----------------------- 2110 2111 struct AAIsDeadImpl : public AAIsDead { 2112 AAIsDeadImpl(const IRPosition &IRP) : AAIsDead(IRP) {} 2113 2114 void initialize(Attributor &A) override { 2115 const Function *F = getAssociatedFunction(); 2116 if (F && !F->isDeclaration()) 2117 exploreFromEntry(A, F); 2118 } 2119 2120 void exploreFromEntry(Attributor &A, const Function *F) { 2121 ToBeExploredPaths.insert(&(F->getEntryBlock().front())); 2122 2123 for (size_t i = 0; i < ToBeExploredPaths.size(); ++i) 2124 if (const Instruction *NextNoReturnI = 2125 findNextNoReturn(A, ToBeExploredPaths[i])) 2126 NoReturnCalls.insert(NextNoReturnI); 2127 2128 // Mark the block live after we looked for no-return instructions. 2129 assumeLive(A, F->getEntryBlock()); 2130 } 2131 2132 /// Find the next assumed noreturn instruction in the block of \p I starting 2133 /// from, thus including, \p I. 2134 /// 2135 /// The caller is responsible to monitor the ToBeExploredPaths set as new 2136 /// instructions discovered in other basic block will be placed in there. 2137 /// 2138 /// \returns The next assumed noreturn instructions in the block of \p I 2139 /// starting from, thus including, \p I. 2140 const Instruction *findNextNoReturn(Attributor &A, const Instruction *I); 2141 2142 /// See AbstractAttribute::getAsStr(). 2143 const std::string getAsStr() const override { 2144 return "Live[#BB " + std::to_string(AssumedLiveBlocks.size()) + "/" + 2145 std::to_string(getAssociatedFunction()->size()) + "][#NRI " + 2146 std::to_string(NoReturnCalls.size()) + "]"; 2147 } 2148 2149 /// See AbstractAttribute::manifest(...). 2150 ChangeStatus manifest(Attributor &A) override { 2151 assert(getState().isValidState() && 2152 "Attempted to manifest an invalid state!"); 2153 2154 ChangeStatus HasChanged = ChangeStatus::UNCHANGED; 2155 Function &F = *getAssociatedFunction(); 2156 2157 if (AssumedLiveBlocks.empty()) { 2158 A.deleteAfterManifest(F); 2159 return ChangeStatus::CHANGED; 2160 } 2161 2162 // Flag to determine if we can change an invoke to a call assuming the 2163 // callee is nounwind. This is not possible if the personality of the 2164 // function allows to catch asynchronous exceptions. 2165 bool Invoke2CallAllowed = !mayCatchAsynchronousExceptions(F); 2166 2167 for (const Instruction *NRC : NoReturnCalls) { 2168 Instruction *I = const_cast<Instruction *>(NRC); 2169 BasicBlock *BB = I->getParent(); 2170 Instruction *SplitPos = I->getNextNode(); 2171 // TODO: mark stuff before unreachable instructions as dead. 2172 2173 if (auto *II = dyn_cast<InvokeInst>(I)) { 2174 // If we keep the invoke the split position is at the beginning of the 2175 // normal desitination block (it invokes a noreturn function after all). 2176 BasicBlock *NormalDestBB = II->getNormalDest(); 2177 SplitPos = &NormalDestBB->front(); 2178 2179 /// Invoke is replaced with a call and unreachable is placed after it if 2180 /// the callee is nounwind and noreturn. Otherwise, we keep the invoke 2181 /// and only place an unreachable in the normal successor. 2182 if (Invoke2CallAllowed) { 2183 if (II->getCalledFunction()) { 2184 const IRPosition &IPos = IRPosition::callsite_function(*II); 2185 const auto &AANoUnw = A.getAAFor<AANoUnwind>(*this, IPos); 2186 if (AANoUnw.isAssumedNoUnwind()) { 2187 LLVM_DEBUG(dbgs() 2188 << "[AAIsDead] Replace invoke with call inst\n"); 2189 // We do not need an invoke (II) but instead want a call followed 2190 // by an unreachable. However, we do not remove II as other 2191 // abstract attributes might have it cached as part of their 2192 // results. Given that we modify the CFG anyway, we simply keep II 2193 // around but in a new dead block. To avoid II being live through 2194 // a different edge we have to ensure the block we place it in is 2195 // only reached from the current block of II and then not reached 2196 // at all when we insert the unreachable. 2197 SplitBlockPredecessors(NormalDestBB, {BB}, ".i2c"); 2198 CallInst *CI = createCallMatchingInvoke(II); 2199 CI->insertBefore(II); 2200 CI->takeName(II); 2201 II->replaceAllUsesWith(CI); 2202 SplitPos = CI->getNextNode(); 2203 } 2204 } 2205 } 2206 2207 if (SplitPos == &NormalDestBB->front()) { 2208 // If this is an invoke of a noreturn function the edge to the normal 2209 // destination block is dead but not necessarily the block itself. 2210 // TODO: We need to move to an edge based system during deduction and 2211 // also manifest. 2212 assert(!NormalDestBB->isLandingPad() && 2213 "Expected the normal destination not to be a landingpad!"); 2214 if (NormalDestBB->getUniquePredecessor() == BB) { 2215 assumeLive(A, *NormalDestBB); 2216 } else { 2217 BasicBlock *SplitBB = 2218 SplitBlockPredecessors(NormalDestBB, {BB}, ".dead"); 2219 // The split block is live even if it contains only an unreachable 2220 // instruction at the end. 2221 assumeLive(A, *SplitBB); 2222 SplitPos = SplitBB->getTerminator(); 2223 HasChanged = ChangeStatus::CHANGED; 2224 } 2225 } 2226 } 2227 2228 if (isa_and_nonnull<UnreachableInst>(SplitPos)) 2229 continue; 2230 2231 BB = SplitPos->getParent(); 2232 SplitBlock(BB, SplitPos); 2233 changeToUnreachable(BB->getTerminator(), /* UseLLVMTrap */ false); 2234 HasChanged = ChangeStatus::CHANGED; 2235 } 2236 2237 for (BasicBlock &BB : F) 2238 if (!AssumedLiveBlocks.count(&BB)) 2239 A.deleteAfterManifest(BB); 2240 2241 return HasChanged; 2242 } 2243 2244 /// See AbstractAttribute::updateImpl(...). 2245 ChangeStatus updateImpl(Attributor &A) override; 2246 2247 /// See AAIsDead::isAssumedDead(BasicBlock *). 2248 bool isAssumedDead(const BasicBlock *BB) const override { 2249 assert(BB->getParent() == getAssociatedFunction() && 2250 "BB must be in the same anchor scope function."); 2251 2252 if (!getAssumed()) 2253 return false; 2254 return !AssumedLiveBlocks.count(BB); 2255 } 2256 2257 /// See AAIsDead::isKnownDead(BasicBlock *). 2258 bool isKnownDead(const BasicBlock *BB) const override { 2259 return getKnown() && isAssumedDead(BB); 2260 } 2261 2262 /// See AAIsDead::isAssumed(Instruction *I). 2263 bool isAssumedDead(const Instruction *I) const override { 2264 assert(I->getParent()->getParent() == getAssociatedFunction() && 2265 "Instruction must be in the same anchor scope function."); 2266 2267 if (!getAssumed()) 2268 return false; 2269 2270 // If it is not in AssumedLiveBlocks then it for sure dead. 2271 // Otherwise, it can still be after noreturn call in a live block. 2272 if (!AssumedLiveBlocks.count(I->getParent())) 2273 return true; 2274 2275 // If it is not after a noreturn call, than it is live. 2276 return isAfterNoReturn(I); 2277 } 2278 2279 /// See AAIsDead::isKnownDead(Instruction *I). 2280 bool isKnownDead(const Instruction *I) const override { 2281 return getKnown() && isAssumedDead(I); 2282 } 2283 2284 /// Check if instruction is after noreturn call, in other words, assumed dead. 2285 bool isAfterNoReturn(const Instruction *I) const; 2286 2287 /// Determine if \p F might catch asynchronous exceptions. 2288 static bool mayCatchAsynchronousExceptions(const Function &F) { 2289 return F.hasPersonalityFn() && !canSimplifyInvokeNoUnwind(&F); 2290 } 2291 2292 /// Assume \p BB is (partially) live now and indicate to the Attributor \p A 2293 /// that internal function called from \p BB should now be looked at. 2294 void assumeLive(Attributor &A, const BasicBlock &BB) { 2295 if (!AssumedLiveBlocks.insert(&BB).second) 2296 return; 2297 2298 // We assume that all of BB is (probably) live now and if there are calls to 2299 // internal functions we will assume that those are now live as well. This 2300 // is a performance optimization for blocks with calls to a lot of internal 2301 // functions. It can however cause dead functions to be treated as live. 2302 for (const Instruction &I : BB) 2303 if (ImmutableCallSite ICS = ImmutableCallSite(&I)) 2304 if (const Function *F = ICS.getCalledFunction()) 2305 if (F->hasLocalLinkage()) 2306 A.markLiveInternalFunction(*F); 2307 } 2308 2309 /// Collection of to be explored paths. 2310 SmallSetVector<const Instruction *, 8> ToBeExploredPaths; 2311 2312 /// Collection of all assumed live BasicBlocks. 2313 DenseSet<const BasicBlock *> AssumedLiveBlocks; 2314 2315 /// Collection of calls with noreturn attribute, assumed or knwon. 2316 SmallSetVector<const Instruction *, 4> NoReturnCalls; 2317 }; 2318 2319 struct AAIsDeadFunction final : public AAIsDeadImpl { 2320 AAIsDeadFunction(const IRPosition &IRP) : AAIsDeadImpl(IRP) {} 2321 2322 /// See AbstractAttribute::trackStatistics() 2323 void trackStatistics() const override { 2324 STATS_DECL(PartiallyDeadBlocks, Function, 2325 "Number of basic blocks classified as partially dead"); 2326 BUILD_STAT_NAME(PartiallyDeadBlocks, Function) += NoReturnCalls.size(); 2327 } 2328 }; 2329 2330 bool AAIsDeadImpl::isAfterNoReturn(const Instruction *I) const { 2331 const Instruction *PrevI = I->getPrevNode(); 2332 while (PrevI) { 2333 if (NoReturnCalls.count(PrevI)) 2334 return true; 2335 PrevI = PrevI->getPrevNode(); 2336 } 2337 return false; 2338 } 2339 2340 const Instruction *AAIsDeadImpl::findNextNoReturn(Attributor &A, 2341 const Instruction *I) { 2342 const BasicBlock *BB = I->getParent(); 2343 const Function &F = *BB->getParent(); 2344 2345 // Flag to determine if we can change an invoke to a call assuming the callee 2346 // is nounwind. This is not possible if the personality of the function allows 2347 // to catch asynchronous exceptions. 2348 bool Invoke2CallAllowed = !mayCatchAsynchronousExceptions(F); 2349 2350 // TODO: We should have a function that determines if an "edge" is dead. 2351 // Edges could be from an instruction to the next or from a terminator 2352 // to the successor. For now, we need to special case the unwind block 2353 // of InvokeInst below. 2354 2355 while (I) { 2356 ImmutableCallSite ICS(I); 2357 2358 if (ICS) { 2359 const IRPosition &IPos = IRPosition::callsite_function(ICS); 2360 // Regarless of the no-return property of an invoke instruction we only 2361 // learn that the regular successor is not reachable through this 2362 // instruction but the unwind block might still be. 2363 if (auto *Invoke = dyn_cast<InvokeInst>(I)) { 2364 // Use nounwind to justify the unwind block is dead as well. 2365 const auto &AANoUnw = A.getAAFor<AANoUnwind>(*this, IPos); 2366 if (!Invoke2CallAllowed || !AANoUnw.isAssumedNoUnwind()) { 2367 assumeLive(A, *Invoke->getUnwindDest()); 2368 ToBeExploredPaths.insert(&Invoke->getUnwindDest()->front()); 2369 } 2370 } 2371 2372 const auto &NoReturnAA = A.getAAFor<AANoReturn>(*this, IPos); 2373 if (NoReturnAA.isAssumedNoReturn()) 2374 return I; 2375 } 2376 2377 I = I->getNextNode(); 2378 } 2379 2380 // get new paths (reachable blocks). 2381 for (const BasicBlock *SuccBB : successors(BB)) { 2382 assumeLive(A, *SuccBB); 2383 ToBeExploredPaths.insert(&SuccBB->front()); 2384 } 2385 2386 // No noreturn instruction found. 2387 return nullptr; 2388 } 2389 2390 ChangeStatus AAIsDeadImpl::updateImpl(Attributor &A) { 2391 ChangeStatus Status = ChangeStatus::UNCHANGED; 2392 2393 // Temporary collection to iterate over existing noreturn instructions. This 2394 // will alow easier modification of NoReturnCalls collection 2395 SmallVector<const Instruction *, 8> NoReturnChanged; 2396 2397 for (const Instruction *I : NoReturnCalls) 2398 NoReturnChanged.push_back(I); 2399 2400 for (const Instruction *I : NoReturnChanged) { 2401 size_t Size = ToBeExploredPaths.size(); 2402 2403 const Instruction *NextNoReturnI = findNextNoReturn(A, I); 2404 if (NextNoReturnI != I) { 2405 Status = ChangeStatus::CHANGED; 2406 NoReturnCalls.remove(I); 2407 if (NextNoReturnI) 2408 NoReturnCalls.insert(NextNoReturnI); 2409 } 2410 2411 // Explore new paths. 2412 while (Size != ToBeExploredPaths.size()) { 2413 Status = ChangeStatus::CHANGED; 2414 if (const Instruction *NextNoReturnI = 2415 findNextNoReturn(A, ToBeExploredPaths[Size++])) 2416 NoReturnCalls.insert(NextNoReturnI); 2417 } 2418 } 2419 2420 LLVM_DEBUG(dbgs() << "[AAIsDead] AssumedLiveBlocks: " 2421 << AssumedLiveBlocks.size() << " Total number of blocks: " 2422 << getAssociatedFunction()->size() << "\n"); 2423 2424 // If we know everything is live there is no need to query for liveness. 2425 if (NoReturnCalls.empty() && 2426 getAssociatedFunction()->size() == AssumedLiveBlocks.size()) { 2427 // Indicating a pessimistic fixpoint will cause the state to be "invalid" 2428 // which will cause the Attributor to not return the AAIsDead on request, 2429 // which will prevent us from querying isAssumedDead(). 2430 indicatePessimisticFixpoint(); 2431 assert(!isValidState() && "Expected an invalid state!"); 2432 Status = ChangeStatus::CHANGED; 2433 } 2434 2435 return Status; 2436 } 2437 2438 /// Liveness information for a call sites. 2439 struct AAIsDeadCallSite final : AAIsDeadImpl { 2440 AAIsDeadCallSite(const IRPosition &IRP) : AAIsDeadImpl(IRP) {} 2441 2442 /// See AbstractAttribute::initialize(...). 2443 void initialize(Attributor &A) override { 2444 // TODO: Once we have call site specific value information we can provide 2445 // call site specific liveness information and then it makes 2446 // sense to specialize attributes for call sites instead of 2447 // redirecting requests to the callee. 2448 llvm_unreachable("Abstract attributes for liveness are not " 2449 "supported for call sites yet!"); 2450 } 2451 2452 /// See AbstractAttribute::updateImpl(...). 2453 ChangeStatus updateImpl(Attributor &A) override { 2454 return indicatePessimisticFixpoint(); 2455 } 2456 2457 /// See AbstractAttribute::trackStatistics() 2458 void trackStatistics() const override {} 2459 }; 2460 2461 /// -------------------- Dereferenceable Argument Attribute -------------------- 2462 2463 template <> 2464 ChangeStatus clampStateAndIndicateChange<DerefState>(DerefState &S, 2465 const DerefState &R) { 2466 ChangeStatus CS0 = clampStateAndIndicateChange<IntegerState>( 2467 S.DerefBytesState, R.DerefBytesState); 2468 ChangeStatus CS1 = 2469 clampStateAndIndicateChange<IntegerState>(S.GlobalState, R.GlobalState); 2470 return CS0 | CS1; 2471 } 2472 2473 struct AADereferenceableImpl : AADereferenceable { 2474 AADereferenceableImpl(const IRPosition &IRP) : AADereferenceable(IRP) {} 2475 using StateType = DerefState; 2476 2477 void initialize(Attributor &A) override { 2478 SmallVector<Attribute, 4> Attrs; 2479 getAttrs({Attribute::Dereferenceable, Attribute::DereferenceableOrNull}, 2480 Attrs); 2481 for (const Attribute &Attr : Attrs) 2482 takeKnownDerefBytesMaximum(Attr.getValueAsInt()); 2483 2484 NonNullAA = &A.getAAFor<AANonNull>(*this, getIRPosition()); 2485 2486 const IRPosition &IRP = this->getIRPosition(); 2487 bool IsFnInterface = IRP.isFnInterfaceKind(); 2488 const Function *FnScope = IRP.getAnchorScope(); 2489 if (IsFnInterface && (!FnScope || !FnScope->hasExactDefinition())) 2490 indicatePessimisticFixpoint(); 2491 } 2492 2493 /// See AbstractAttribute::getState() 2494 /// { 2495 StateType &getState() override { return *this; } 2496 const StateType &getState() const override { return *this; } 2497 /// } 2498 2499 /// See AAFromMustBeExecutedContext 2500 bool followUse(Attributor &A, const Use *U, const Instruction *I) { 2501 bool IsNonNull = false; 2502 bool TrackUse = false; 2503 int64_t DerefBytes = getKnownNonNullAndDerefBytesForUse( 2504 A, *this, getAssociatedValue(), U, I, IsNonNull, TrackUse); 2505 takeKnownDerefBytesMaximum(DerefBytes); 2506 return TrackUse; 2507 } 2508 2509 void getDeducedAttributes(LLVMContext &Ctx, 2510 SmallVectorImpl<Attribute> &Attrs) const override { 2511 // TODO: Add *_globally support 2512 if (isAssumedNonNull()) 2513 Attrs.emplace_back(Attribute::getWithDereferenceableBytes( 2514 Ctx, getAssumedDereferenceableBytes())); 2515 else 2516 Attrs.emplace_back(Attribute::getWithDereferenceableOrNullBytes( 2517 Ctx, getAssumedDereferenceableBytes())); 2518 } 2519 2520 /// See AbstractAttribute::getAsStr(). 2521 const std::string getAsStr() const override { 2522 if (!getAssumedDereferenceableBytes()) 2523 return "unknown-dereferenceable"; 2524 return std::string("dereferenceable") + 2525 (isAssumedNonNull() ? "" : "_or_null") + 2526 (isAssumedGlobal() ? "_globally" : "") + "<" + 2527 std::to_string(getKnownDereferenceableBytes()) + "-" + 2528 std::to_string(getAssumedDereferenceableBytes()) + ">"; 2529 } 2530 }; 2531 2532 /// Dereferenceable attribute for a floating value. 2533 struct AADereferenceableFloating 2534 : AAFromMustBeExecutedContext<AADereferenceable, AADereferenceableImpl> { 2535 using Base = 2536 AAFromMustBeExecutedContext<AADereferenceable, AADereferenceableImpl>; 2537 AADereferenceableFloating(const IRPosition &IRP) : Base(IRP) {} 2538 2539 /// See AbstractAttribute::updateImpl(...). 2540 ChangeStatus updateImpl(Attributor &A) override { 2541 ChangeStatus Change = Base::updateImpl(A); 2542 2543 const DataLayout &DL = A.getDataLayout(); 2544 2545 auto VisitValueCB = [&](Value &V, DerefState &T, bool Stripped) -> bool { 2546 unsigned IdxWidth = 2547 DL.getIndexSizeInBits(V.getType()->getPointerAddressSpace()); 2548 APInt Offset(IdxWidth, 0); 2549 const Value *Base = 2550 V.stripAndAccumulateInBoundsConstantOffsets(DL, Offset); 2551 2552 const auto &AA = 2553 A.getAAFor<AADereferenceable>(*this, IRPosition::value(*Base)); 2554 int64_t DerefBytes = 0; 2555 if (!Stripped && this == &AA) { 2556 // Use IR information if we did not strip anything. 2557 // TODO: track globally. 2558 bool CanBeNull; 2559 DerefBytes = Base->getPointerDereferenceableBytes(DL, CanBeNull); 2560 T.GlobalState.indicatePessimisticFixpoint(); 2561 } else { 2562 const DerefState &DS = static_cast<const DerefState &>(AA.getState()); 2563 DerefBytes = DS.DerefBytesState.getAssumed(); 2564 T.GlobalState &= DS.GlobalState; 2565 } 2566 2567 // For now we do not try to "increase" dereferenceability due to negative 2568 // indices as we first have to come up with code to deal with loops and 2569 // for overflows of the dereferenceable bytes. 2570 int64_t OffsetSExt = Offset.getSExtValue(); 2571 if (OffsetSExt < 0) 2572 OffsetSExt = 0; 2573 2574 T.takeAssumedDerefBytesMinimum( 2575 std::max(int64_t(0), DerefBytes - OffsetSExt)); 2576 2577 if (this == &AA) { 2578 if (!Stripped) { 2579 // If nothing was stripped IR information is all we got. 2580 T.takeKnownDerefBytesMaximum( 2581 std::max(int64_t(0), DerefBytes - OffsetSExt)); 2582 T.indicatePessimisticFixpoint(); 2583 } else if (OffsetSExt > 0) { 2584 // If something was stripped but there is circular reasoning we look 2585 // for the offset. If it is positive we basically decrease the 2586 // dereferenceable bytes in a circluar loop now, which will simply 2587 // drive them down to the known value in a very slow way which we 2588 // can accelerate. 2589 T.indicatePessimisticFixpoint(); 2590 } 2591 } 2592 2593 return T.isValidState(); 2594 }; 2595 2596 DerefState T; 2597 if (!genericValueTraversal<AADereferenceable, DerefState>( 2598 A, getIRPosition(), *this, T, VisitValueCB)) 2599 return indicatePessimisticFixpoint(); 2600 2601 return Change | clampStateAndIndicateChange(getState(), T); 2602 } 2603 2604 /// See AbstractAttribute::trackStatistics() 2605 void trackStatistics() const override { 2606 STATS_DECLTRACK_FLOATING_ATTR(dereferenceable) 2607 } 2608 }; 2609 2610 /// Dereferenceable attribute for a return value. 2611 struct AADereferenceableReturned final 2612 : AAReturnedFromReturnedValues<AADereferenceable, AADereferenceableImpl, 2613 DerefState> { 2614 AADereferenceableReturned(const IRPosition &IRP) 2615 : AAReturnedFromReturnedValues<AADereferenceable, AADereferenceableImpl, 2616 DerefState>(IRP) {} 2617 2618 /// See AbstractAttribute::trackStatistics() 2619 void trackStatistics() const override { 2620 STATS_DECLTRACK_FNRET_ATTR(dereferenceable) 2621 } 2622 }; 2623 2624 /// Dereferenceable attribute for an argument 2625 struct AADereferenceableArgument final 2626 : AAArgumentFromCallSiteArgumentsAndMustBeExecutedContext< 2627 AADereferenceable, AADereferenceableImpl, DerefState> { 2628 using Base = AAArgumentFromCallSiteArgumentsAndMustBeExecutedContext< 2629 AADereferenceable, AADereferenceableImpl, DerefState>; 2630 AADereferenceableArgument(const IRPosition &IRP) : Base(IRP) {} 2631 2632 /// See AbstractAttribute::trackStatistics() 2633 void trackStatistics() const override { 2634 STATS_DECLTRACK_ARG_ATTR(dereferenceable) 2635 } 2636 }; 2637 2638 /// Dereferenceable attribute for a call site argument. 2639 struct AADereferenceableCallSiteArgument final : AADereferenceableFloating { 2640 AADereferenceableCallSiteArgument(const IRPosition &IRP) 2641 : AADereferenceableFloating(IRP) {} 2642 2643 /// See AbstractAttribute::trackStatistics() 2644 void trackStatistics() const override { 2645 STATS_DECLTRACK_CSARG_ATTR(dereferenceable) 2646 } 2647 }; 2648 2649 /// Dereferenceable attribute deduction for a call site return value. 2650 struct AADereferenceableCallSiteReturned final 2651 : AACallSiteReturnedFromReturnedAndMustBeExecutedContext< 2652 AADereferenceable, AADereferenceableImpl> { 2653 using Base = AACallSiteReturnedFromReturnedAndMustBeExecutedContext< 2654 AADereferenceable, AADereferenceableImpl>; 2655 AADereferenceableCallSiteReturned(const IRPosition &IRP) : Base(IRP) {} 2656 2657 /// See AbstractAttribute::initialize(...). 2658 void initialize(Attributor &A) override { 2659 Base::initialize(A); 2660 Function *F = getAssociatedFunction(); 2661 if (!F) 2662 indicatePessimisticFixpoint(); 2663 } 2664 2665 /// See AbstractAttribute::updateImpl(...). 2666 ChangeStatus updateImpl(Attributor &A) override { 2667 // TODO: Once we have call site specific value information we can provide 2668 // call site specific liveness information and then it makes 2669 // sense to specialize attributes for call sites arguments instead of 2670 // redirecting requests to the callee argument. 2671 2672 ChangeStatus Change = Base::updateImpl(A); 2673 Function *F = getAssociatedFunction(); 2674 const IRPosition &FnPos = IRPosition::returned(*F); 2675 auto &FnAA = A.getAAFor<AADereferenceable>(*this, FnPos); 2676 return Change | 2677 clampStateAndIndicateChange( 2678 getState(), static_cast<const DerefState &>(FnAA.getState())); 2679 } 2680 2681 /// See AbstractAttribute::trackStatistics() 2682 void trackStatistics() const override { 2683 STATS_DECLTRACK_CS_ATTR(dereferenceable); 2684 } 2685 }; 2686 2687 // ------------------------ Align Argument Attribute ------------------------ 2688 2689 struct AAAlignImpl : AAAlign { 2690 AAAlignImpl(const IRPosition &IRP) : AAAlign(IRP) {} 2691 2692 // Max alignemnt value allowed in IR 2693 static const unsigned MAX_ALIGN = 1U << 29; 2694 2695 /// See AbstractAttribute::initialize(...). 2696 void initialize(Attributor &A) override { 2697 takeAssumedMinimum(MAX_ALIGN); 2698 2699 SmallVector<Attribute, 4> Attrs; 2700 getAttrs({Attribute::Alignment}, Attrs); 2701 for (const Attribute &Attr : Attrs) 2702 takeKnownMaximum(Attr.getValueAsInt()); 2703 2704 if (getIRPosition().isFnInterfaceKind() && 2705 (!getAssociatedFunction() || 2706 !getAssociatedFunction()->hasExactDefinition())) 2707 indicatePessimisticFixpoint(); 2708 } 2709 2710 /// See AbstractAttribute::manifest(...). 2711 ChangeStatus manifest(Attributor &A) override { 2712 ChangeStatus Changed = ChangeStatus::UNCHANGED; 2713 2714 // Check for users that allow alignment annotations. 2715 Value &AnchorVal = getIRPosition().getAnchorValue(); 2716 for (const Use &U : AnchorVal.uses()) { 2717 if (auto *SI = dyn_cast<StoreInst>(U.getUser())) { 2718 if (SI->getPointerOperand() == &AnchorVal) 2719 if (SI->getAlignment() < getAssumedAlign()) { 2720 STATS_DECLTRACK(AAAlign, Store, 2721 "Number of times alignemnt added to a store"); 2722 SI->setAlignment(Align(getAssumedAlign())); 2723 Changed = ChangeStatus::CHANGED; 2724 } 2725 } else if (auto *LI = dyn_cast<LoadInst>(U.getUser())) { 2726 if (LI->getPointerOperand() == &AnchorVal) 2727 if (LI->getAlignment() < getAssumedAlign()) { 2728 LI->setAlignment(Align(getAssumedAlign())); 2729 STATS_DECLTRACK(AAAlign, Load, 2730 "Number of times alignemnt added to a load"); 2731 Changed = ChangeStatus::CHANGED; 2732 } 2733 } 2734 } 2735 2736 return AAAlign::manifest(A) | Changed; 2737 } 2738 2739 // TODO: Provide a helper to determine the implied ABI alignment and check in 2740 // the existing manifest method and a new one for AAAlignImpl that value 2741 // to avoid making the alignment explicit if it did not improve. 2742 2743 /// See AbstractAttribute::getDeducedAttributes 2744 virtual void 2745 getDeducedAttributes(LLVMContext &Ctx, 2746 SmallVectorImpl<Attribute> &Attrs) const override { 2747 if (getAssumedAlign() > 1) 2748 Attrs.emplace_back( 2749 Attribute::getWithAlignment(Ctx, Align(getAssumedAlign()))); 2750 } 2751 2752 /// See AbstractAttribute::getAsStr(). 2753 const std::string getAsStr() const override { 2754 return getAssumedAlign() ? ("align<" + std::to_string(getKnownAlign()) + 2755 "-" + std::to_string(getAssumedAlign()) + ">") 2756 : "unknown-align"; 2757 } 2758 }; 2759 2760 /// Align attribute for a floating value. 2761 struct AAAlignFloating : AAAlignImpl { 2762 AAAlignFloating(const IRPosition &IRP) : AAAlignImpl(IRP) {} 2763 2764 /// See AbstractAttribute::updateImpl(...). 2765 ChangeStatus updateImpl(Attributor &A) override { 2766 const DataLayout &DL = A.getDataLayout(); 2767 2768 auto VisitValueCB = [&](Value &V, AAAlign::StateType &T, 2769 bool Stripped) -> bool { 2770 const auto &AA = A.getAAFor<AAAlign>(*this, IRPosition::value(V)); 2771 if (!Stripped && this == &AA) { 2772 // Use only IR information if we did not strip anything. 2773 const MaybeAlign PA = V.getPointerAlignment(DL); 2774 T.takeKnownMaximum(PA ? PA->value() : 0); 2775 T.indicatePessimisticFixpoint(); 2776 } else { 2777 // Use abstract attribute information. 2778 const AAAlign::StateType &DS = 2779 static_cast<const AAAlign::StateType &>(AA.getState()); 2780 T ^= DS; 2781 } 2782 return T.isValidState(); 2783 }; 2784 2785 StateType T; 2786 if (!genericValueTraversal<AAAlign, StateType>(A, getIRPosition(), *this, T, 2787 VisitValueCB)) 2788 return indicatePessimisticFixpoint(); 2789 2790 // TODO: If we know we visited all incoming values, thus no are assumed 2791 // dead, we can take the known information from the state T. 2792 return clampStateAndIndicateChange(getState(), T); 2793 } 2794 2795 /// See AbstractAttribute::trackStatistics() 2796 void trackStatistics() const override { STATS_DECLTRACK_FLOATING_ATTR(align) } 2797 }; 2798 2799 /// Align attribute for function return value. 2800 struct AAAlignReturned final 2801 : AAReturnedFromReturnedValues<AAAlign, AAAlignImpl> { 2802 AAAlignReturned(const IRPosition &IRP) 2803 : AAReturnedFromReturnedValues<AAAlign, AAAlignImpl>(IRP) {} 2804 2805 /// See AbstractAttribute::trackStatistics() 2806 void trackStatistics() const override { STATS_DECLTRACK_FNRET_ATTR(aligned) } 2807 }; 2808 2809 /// Align attribute for function argument. 2810 struct AAAlignArgument final 2811 : AAArgumentFromCallSiteArguments<AAAlign, AAAlignImpl> { 2812 AAAlignArgument(const IRPosition &IRP) 2813 : AAArgumentFromCallSiteArguments<AAAlign, AAAlignImpl>(IRP) {} 2814 2815 /// See AbstractAttribute::trackStatistics() 2816 void trackStatistics() const override { STATS_DECLTRACK_ARG_ATTR(aligned) } 2817 }; 2818 2819 struct AAAlignCallSiteArgument final : AAAlignFloating { 2820 AAAlignCallSiteArgument(const IRPosition &IRP) : AAAlignFloating(IRP) {} 2821 2822 /// See AbstractAttribute::manifest(...). 2823 ChangeStatus manifest(Attributor &A) override { 2824 return AAAlignImpl::manifest(A); 2825 } 2826 2827 /// See AbstractAttribute::trackStatistics() 2828 void trackStatistics() const override { STATS_DECLTRACK_CSARG_ATTR(aligned) } 2829 }; 2830 2831 /// Align attribute deduction for a call site return value. 2832 struct AAAlignCallSiteReturned final : AAAlignImpl { 2833 AAAlignCallSiteReturned(const IRPosition &IRP) : AAAlignImpl(IRP) {} 2834 2835 /// See AbstractAttribute::initialize(...). 2836 void initialize(Attributor &A) override { 2837 AAAlignImpl::initialize(A); 2838 Function *F = getAssociatedFunction(); 2839 if (!F) 2840 indicatePessimisticFixpoint(); 2841 } 2842 2843 /// See AbstractAttribute::updateImpl(...). 2844 ChangeStatus updateImpl(Attributor &A) override { 2845 // TODO: Once we have call site specific value information we can provide 2846 // call site specific liveness information and then it makes 2847 // sense to specialize attributes for call sites arguments instead of 2848 // redirecting requests to the callee argument. 2849 Function *F = getAssociatedFunction(); 2850 const IRPosition &FnPos = IRPosition::returned(*F); 2851 auto &FnAA = A.getAAFor<AAAlign>(*this, FnPos); 2852 return clampStateAndIndicateChange( 2853 getState(), static_cast<const AAAlign::StateType &>(FnAA.getState())); 2854 } 2855 2856 /// See AbstractAttribute::trackStatistics() 2857 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(align); } 2858 }; 2859 2860 /// ------------------ Function No-Return Attribute ---------------------------- 2861 struct AANoReturnImpl : public AANoReturn { 2862 AANoReturnImpl(const IRPosition &IRP) : AANoReturn(IRP) {} 2863 2864 /// See AbstractAttribute::initialize(...). 2865 void initialize(Attributor &A) override { 2866 AANoReturn::initialize(A); 2867 Function *F = getAssociatedFunction(); 2868 if (!F || F->hasFnAttribute(Attribute::WillReturn)) 2869 indicatePessimisticFixpoint(); 2870 } 2871 2872 /// See AbstractAttribute::getAsStr(). 2873 const std::string getAsStr() const override { 2874 return getAssumed() ? "noreturn" : "may-return"; 2875 } 2876 2877 /// See AbstractAttribute::updateImpl(Attributor &A). 2878 virtual ChangeStatus updateImpl(Attributor &A) override { 2879 const auto &WillReturnAA = A.getAAFor<AAWillReturn>(*this, getIRPosition()); 2880 if (WillReturnAA.isKnownWillReturn()) 2881 return indicatePessimisticFixpoint(); 2882 auto CheckForNoReturn = [](Instruction &) { return false; }; 2883 if (!A.checkForAllInstructions(CheckForNoReturn, *this, 2884 {(unsigned)Instruction::Ret})) 2885 return indicatePessimisticFixpoint(); 2886 return ChangeStatus::UNCHANGED; 2887 } 2888 }; 2889 2890 struct AANoReturnFunction final : AANoReturnImpl { 2891 AANoReturnFunction(const IRPosition &IRP) : AANoReturnImpl(IRP) {} 2892 2893 /// See AbstractAttribute::trackStatistics() 2894 void trackStatistics() const override { STATS_DECLTRACK_FN_ATTR(noreturn) } 2895 }; 2896 2897 /// NoReturn attribute deduction for a call sites. 2898 struct AANoReturnCallSite final : AANoReturnImpl { 2899 AANoReturnCallSite(const IRPosition &IRP) : AANoReturnImpl(IRP) {} 2900 2901 /// See AbstractAttribute::updateImpl(...). 2902 ChangeStatus updateImpl(Attributor &A) override { 2903 // TODO: Once we have call site specific value information we can provide 2904 // call site specific liveness information and then it makes 2905 // sense to specialize attributes for call sites arguments instead of 2906 // redirecting requests to the callee argument. 2907 Function *F = getAssociatedFunction(); 2908 const IRPosition &FnPos = IRPosition::function(*F); 2909 auto &FnAA = A.getAAFor<AANoReturn>(*this, FnPos); 2910 return clampStateAndIndicateChange( 2911 getState(), 2912 static_cast<const AANoReturn::StateType &>(FnAA.getState())); 2913 } 2914 2915 /// See AbstractAttribute::trackStatistics() 2916 void trackStatistics() const override { STATS_DECLTRACK_CS_ATTR(noreturn); } 2917 }; 2918 2919 /// ----------------------- Variable Capturing --------------------------------- 2920 2921 /// A class to hold the state of for no-capture attributes. 2922 struct AANoCaptureImpl : public AANoCapture { 2923 AANoCaptureImpl(const IRPosition &IRP) : AANoCapture(IRP) {} 2924 2925 /// See AbstractAttribute::initialize(...). 2926 void initialize(Attributor &A) override { 2927 AANoCapture::initialize(A); 2928 2929 // You cannot "capture" null in the default address space. 2930 if (isa<ConstantPointerNull>(getAssociatedValue()) && 2931 getAssociatedValue().getType()->getPointerAddressSpace() == 0) { 2932 indicateOptimisticFixpoint(); 2933 return; 2934 } 2935 2936 const IRPosition &IRP = getIRPosition(); 2937 const Function *F = 2938 getArgNo() >= 0 ? IRP.getAssociatedFunction() : IRP.getAnchorScope(); 2939 2940 // Check what state the associated function can actually capture. 2941 if (F) 2942 determineFunctionCaptureCapabilities(*F, *this); 2943 else 2944 indicatePessimisticFixpoint(); 2945 } 2946 2947 /// See AbstractAttribute::updateImpl(...). 2948 ChangeStatus updateImpl(Attributor &A) override; 2949 2950 /// see AbstractAttribute::isAssumedNoCaptureMaybeReturned(...). 2951 virtual void 2952 getDeducedAttributes(LLVMContext &Ctx, 2953 SmallVectorImpl<Attribute> &Attrs) const override { 2954 if (!isAssumedNoCaptureMaybeReturned()) 2955 return; 2956 2957 if (getArgNo() >= 0) { 2958 if (isAssumedNoCapture()) 2959 Attrs.emplace_back(Attribute::get(Ctx, Attribute::NoCapture)); 2960 else if (ManifestInternal) 2961 Attrs.emplace_back(Attribute::get(Ctx, "no-capture-maybe-returned")); 2962 } 2963 } 2964 2965 /// Set the NOT_CAPTURED_IN_MEM and NOT_CAPTURED_IN_RET bits in \p Known 2966 /// depending on the ability of the function associated with \p IRP to capture 2967 /// state in memory and through "returning/throwing", respectively. 2968 static void determineFunctionCaptureCapabilities(const Function &F, 2969 IntegerState &State) { 2970 // TODO: Once we have memory behavior attributes we should use them here. 2971 2972 // If we know we cannot communicate or write to memory, we do not care about 2973 // ptr2int anymore. 2974 if (F.onlyReadsMemory() && F.doesNotThrow() && 2975 F.getReturnType()->isVoidTy()) { 2976 State.addKnownBits(NO_CAPTURE); 2977 return; 2978 } 2979 2980 // A function cannot capture state in memory if it only reads memory, it can 2981 // however return/throw state and the state might be influenced by the 2982 // pointer value, e.g., loading from a returned pointer might reveal a bit. 2983 if (F.onlyReadsMemory()) 2984 State.addKnownBits(NOT_CAPTURED_IN_MEM); 2985 2986 // A function cannot communicate state back if it does not through 2987 // exceptions and doesn not return values. 2988 if (F.doesNotThrow() && F.getReturnType()->isVoidTy()) 2989 State.addKnownBits(NOT_CAPTURED_IN_RET); 2990 } 2991 2992 /// See AbstractState::getAsStr(). 2993 const std::string getAsStr() const override { 2994 if (isKnownNoCapture()) 2995 return "known not-captured"; 2996 if (isAssumedNoCapture()) 2997 return "assumed not-captured"; 2998 if (isKnownNoCaptureMaybeReturned()) 2999 return "known not-captured-maybe-returned"; 3000 if (isAssumedNoCaptureMaybeReturned()) 3001 return "assumed not-captured-maybe-returned"; 3002 return "assumed-captured"; 3003 } 3004 }; 3005 3006 /// Attributor-aware capture tracker. 3007 struct AACaptureUseTracker final : public CaptureTracker { 3008 3009 /// Create a capture tracker that can lookup in-flight abstract attributes 3010 /// through the Attributor \p A. 3011 /// 3012 /// If a use leads to a potential capture, \p CapturedInMemory is set and the 3013 /// search is stopped. If a use leads to a return instruction, 3014 /// \p CommunicatedBack is set to true and \p CapturedInMemory is not changed. 3015 /// If a use leads to a ptr2int which may capture the value, 3016 /// \p CapturedInInteger is set. If a use is found that is currently assumed 3017 /// "no-capture-maybe-returned", the user is added to the \p PotentialCopies 3018 /// set. All values in \p PotentialCopies are later tracked as well. For every 3019 /// explored use we decrement \p RemainingUsesToExplore. Once it reaches 0, 3020 /// the search is stopped with \p CapturedInMemory and \p CapturedInInteger 3021 /// conservatively set to true. 3022 AACaptureUseTracker(Attributor &A, AANoCapture &NoCaptureAA, 3023 const AAIsDead &IsDeadAA, IntegerState &State, 3024 SmallVectorImpl<const Value *> &PotentialCopies, 3025 unsigned &RemainingUsesToExplore) 3026 : A(A), NoCaptureAA(NoCaptureAA), IsDeadAA(IsDeadAA), State(State), 3027 PotentialCopies(PotentialCopies), 3028 RemainingUsesToExplore(RemainingUsesToExplore) {} 3029 3030 /// Determine if \p V maybe captured. *Also updates the state!* 3031 bool valueMayBeCaptured(const Value *V) { 3032 if (V->getType()->isPointerTy()) { 3033 PointerMayBeCaptured(V, this); 3034 } else { 3035 State.indicatePessimisticFixpoint(); 3036 } 3037 return State.isAssumed(AANoCapture::NO_CAPTURE_MAYBE_RETURNED); 3038 } 3039 3040 /// See CaptureTracker::tooManyUses(). 3041 void tooManyUses() override { 3042 State.removeAssumedBits(AANoCapture::NO_CAPTURE); 3043 } 3044 3045 bool isDereferenceableOrNull(Value *O, const DataLayout &DL) override { 3046 if (CaptureTracker::isDereferenceableOrNull(O, DL)) 3047 return true; 3048 const auto &DerefAA = 3049 A.getAAFor<AADereferenceable>(NoCaptureAA, IRPosition::value(*O)); 3050 return DerefAA.getAssumedDereferenceableBytes(); 3051 } 3052 3053 /// See CaptureTracker::captured(...). 3054 bool captured(const Use *U) override { 3055 Instruction *UInst = cast<Instruction>(U->getUser()); 3056 LLVM_DEBUG(dbgs() << "Check use: " << *U->get() << " in " << *UInst 3057 << "\n"); 3058 3059 // Because we may reuse the tracker multiple times we keep track of the 3060 // number of explored uses ourselves as well. 3061 if (RemainingUsesToExplore-- == 0) { 3062 LLVM_DEBUG(dbgs() << " - too many uses to explore!\n"); 3063 return isCapturedIn(/* Memory */ true, /* Integer */ true, 3064 /* Return */ true); 3065 } 3066 3067 // Deal with ptr2int by following uses. 3068 if (isa<PtrToIntInst>(UInst)) { 3069 LLVM_DEBUG(dbgs() << " - ptr2int assume the worst!\n"); 3070 return valueMayBeCaptured(UInst); 3071 } 3072 3073 // Explicitly catch return instructions. 3074 if (isa<ReturnInst>(UInst)) 3075 return isCapturedIn(/* Memory */ false, /* Integer */ false, 3076 /* Return */ true); 3077 3078 // For now we only use special logic for call sites. However, the tracker 3079 // itself knows about a lot of other non-capturing cases already. 3080 CallSite CS(UInst); 3081 if (!CS || !CS.isArgOperand(U)) 3082 return isCapturedIn(/* Memory */ true, /* Integer */ true, 3083 /* Return */ true); 3084 3085 unsigned ArgNo = CS.getArgumentNo(U); 3086 const IRPosition &CSArgPos = IRPosition::callsite_argument(CS, ArgNo); 3087 // If we have a abstract no-capture attribute for the argument we can use 3088 // it to justify a non-capture attribute here. This allows recursion! 3089 auto &ArgNoCaptureAA = A.getAAFor<AANoCapture>(NoCaptureAA, CSArgPos); 3090 if (ArgNoCaptureAA.isAssumedNoCapture()) 3091 return isCapturedIn(/* Memory */ false, /* Integer */ false, 3092 /* Return */ false); 3093 if (ArgNoCaptureAA.isAssumedNoCaptureMaybeReturned()) { 3094 addPotentialCopy(CS); 3095 return isCapturedIn(/* Memory */ false, /* Integer */ false, 3096 /* Return */ false); 3097 } 3098 3099 // Lastly, we could not find a reason no-capture can be assumed so we don't. 3100 return isCapturedIn(/* Memory */ true, /* Integer */ true, 3101 /* Return */ true); 3102 } 3103 3104 /// Register \p CS as potential copy of the value we are checking. 3105 void addPotentialCopy(CallSite CS) { 3106 PotentialCopies.push_back(CS.getInstruction()); 3107 } 3108 3109 /// See CaptureTracker::shouldExplore(...). 3110 bool shouldExplore(const Use *U) override { 3111 // Check liveness. 3112 return !IsDeadAA.isAssumedDead(cast<Instruction>(U->getUser())); 3113 } 3114 3115 /// Update the state according to \p CapturedInMem, \p CapturedInInt, and 3116 /// \p CapturedInRet, then return the appropriate value for use in the 3117 /// CaptureTracker::captured() interface. 3118 bool isCapturedIn(bool CapturedInMem, bool CapturedInInt, 3119 bool CapturedInRet) { 3120 LLVM_DEBUG(dbgs() << " - captures [Mem " << CapturedInMem << "|Int " 3121 << CapturedInInt << "|Ret " << CapturedInRet << "]\n"); 3122 if (CapturedInMem) 3123 State.removeAssumedBits(AANoCapture::NOT_CAPTURED_IN_MEM); 3124 if (CapturedInInt) 3125 State.removeAssumedBits(AANoCapture::NOT_CAPTURED_IN_INT); 3126 if (CapturedInRet) 3127 State.removeAssumedBits(AANoCapture::NOT_CAPTURED_IN_RET); 3128 return !State.isAssumed(AANoCapture::NO_CAPTURE_MAYBE_RETURNED); 3129 } 3130 3131 private: 3132 /// The attributor providing in-flight abstract attributes. 3133 Attributor &A; 3134 3135 /// The abstract attribute currently updated. 3136 AANoCapture &NoCaptureAA; 3137 3138 /// The abstract liveness state. 3139 const AAIsDead &IsDeadAA; 3140 3141 /// The state currently updated. 3142 IntegerState &State; 3143 3144 /// Set of potential copies of the tracked value. 3145 SmallVectorImpl<const Value *> &PotentialCopies; 3146 3147 /// Global counter to limit the number of explored uses. 3148 unsigned &RemainingUsesToExplore; 3149 }; 3150 3151 ChangeStatus AANoCaptureImpl::updateImpl(Attributor &A) { 3152 const IRPosition &IRP = getIRPosition(); 3153 const Value *V = 3154 getArgNo() >= 0 ? IRP.getAssociatedArgument() : &IRP.getAssociatedValue(); 3155 if (!V) 3156 return indicatePessimisticFixpoint(); 3157 3158 const Function *F = 3159 getArgNo() >= 0 ? IRP.getAssociatedFunction() : IRP.getAnchorScope(); 3160 assert(F && "Expected a function!"); 3161 const auto &IsDeadAA = A.getAAFor<AAIsDead>(*this, IRPosition::function(*F)); 3162 3163 AANoCapture::StateType T; 3164 // TODO: Once we have memory behavior attributes we should use them here 3165 // similar to the reasoning in 3166 // AANoCaptureImpl::determineFunctionCaptureCapabilities(...). 3167 3168 // TODO: Use the AAReturnedValues to learn if the argument can return or 3169 // not. 3170 3171 // Use the CaptureTracker interface and logic with the specialized tracker, 3172 // defined in AACaptureUseTracker, that can look at in-flight abstract 3173 // attributes and directly updates the assumed state. 3174 SmallVector<const Value *, 4> PotentialCopies; 3175 unsigned RemainingUsesToExplore = DefaultMaxUsesToExplore; 3176 AACaptureUseTracker Tracker(A, *this, IsDeadAA, T, PotentialCopies, 3177 RemainingUsesToExplore); 3178 3179 // Check all potential copies of the associated value until we can assume 3180 // none will be captured or we have to assume at least one might be. 3181 unsigned Idx = 0; 3182 PotentialCopies.push_back(V); 3183 while (T.isAssumed(NO_CAPTURE_MAYBE_RETURNED) && Idx < PotentialCopies.size()) 3184 Tracker.valueMayBeCaptured(PotentialCopies[Idx++]); 3185 3186 AAAlign::StateType &S = getState(); 3187 auto Assumed = S.getAssumed(); 3188 S.intersectAssumedBits(T.getAssumed()); 3189 return Assumed == S.getAssumed() ? ChangeStatus::UNCHANGED 3190 : ChangeStatus::CHANGED; 3191 } 3192 3193 /// NoCapture attribute for function arguments. 3194 struct AANoCaptureArgument final : AANoCaptureImpl { 3195 AANoCaptureArgument(const IRPosition &IRP) : AANoCaptureImpl(IRP) {} 3196 3197 /// See AbstractAttribute::trackStatistics() 3198 void trackStatistics() const override { STATS_DECLTRACK_ARG_ATTR(nocapture) } 3199 }; 3200 3201 /// NoCapture attribute for call site arguments. 3202 struct AANoCaptureCallSiteArgument final : AANoCaptureImpl { 3203 AANoCaptureCallSiteArgument(const IRPosition &IRP) : AANoCaptureImpl(IRP) {} 3204 3205 /// See AbstractAttribute::updateImpl(...). 3206 ChangeStatus updateImpl(Attributor &A) override { 3207 // TODO: Once we have call site specific value information we can provide 3208 // call site specific liveness information and then it makes 3209 // sense to specialize attributes for call sites arguments instead of 3210 // redirecting requests to the callee argument. 3211 Argument *Arg = getAssociatedArgument(); 3212 if (!Arg) 3213 return indicatePessimisticFixpoint(); 3214 const IRPosition &ArgPos = IRPosition::argument(*Arg); 3215 auto &ArgAA = A.getAAFor<AANoCapture>(*this, ArgPos); 3216 return clampStateAndIndicateChange( 3217 getState(), 3218 static_cast<const AANoCapture::StateType &>(ArgAA.getState())); 3219 } 3220 3221 /// See AbstractAttribute::trackStatistics() 3222 void trackStatistics() const override{STATS_DECLTRACK_CSARG_ATTR(nocapture)}; 3223 }; 3224 3225 /// NoCapture attribute for floating values. 3226 struct AANoCaptureFloating final : AANoCaptureImpl { 3227 AANoCaptureFloating(const IRPosition &IRP) : AANoCaptureImpl(IRP) {} 3228 3229 /// See AbstractAttribute::trackStatistics() 3230 void trackStatistics() const override { 3231 STATS_DECLTRACK_FLOATING_ATTR(nocapture) 3232 } 3233 }; 3234 3235 /// NoCapture attribute for function return value. 3236 struct AANoCaptureReturned final : AANoCaptureImpl { 3237 AANoCaptureReturned(const IRPosition &IRP) : AANoCaptureImpl(IRP) { 3238 llvm_unreachable("NoCapture is not applicable to function returns!"); 3239 } 3240 3241 /// See AbstractAttribute::initialize(...). 3242 void initialize(Attributor &A) override { 3243 llvm_unreachable("NoCapture is not applicable to function returns!"); 3244 } 3245 3246 /// See AbstractAttribute::updateImpl(...). 3247 ChangeStatus updateImpl(Attributor &A) override { 3248 llvm_unreachable("NoCapture is not applicable to function returns!"); 3249 } 3250 3251 /// See AbstractAttribute::trackStatistics() 3252 void trackStatistics() const override {} 3253 }; 3254 3255 /// NoCapture attribute deduction for a call site return value. 3256 struct AANoCaptureCallSiteReturned final : AANoCaptureImpl { 3257 AANoCaptureCallSiteReturned(const IRPosition &IRP) : AANoCaptureImpl(IRP) {} 3258 3259 /// See AbstractAttribute::trackStatistics() 3260 void trackStatistics() const override { 3261 STATS_DECLTRACK_CSRET_ATTR(nocapture) 3262 } 3263 }; 3264 3265 /// ------------------ Value Simplify Attribute ---------------------------- 3266 struct AAValueSimplifyImpl : AAValueSimplify { 3267 AAValueSimplifyImpl(const IRPosition &IRP) : AAValueSimplify(IRP) {} 3268 3269 /// See AbstractAttribute::getAsStr(). 3270 const std::string getAsStr() const override { 3271 return getAssumed() ? (getKnown() ? "simplified" : "maybe-simple") 3272 : "not-simple"; 3273 } 3274 3275 /// See AbstractAttribute::trackStatistics() 3276 void trackStatistics() const override {} 3277 3278 /// See AAValueSimplify::getAssumedSimplifiedValue() 3279 Optional<Value *> getAssumedSimplifiedValue(Attributor &A) const override { 3280 if (!getAssumed()) 3281 return const_cast<Value *>(&getAssociatedValue()); 3282 return SimplifiedAssociatedValue; 3283 } 3284 void initialize(Attributor &A) override {} 3285 3286 /// Helper function for querying AAValueSimplify and updating candicate. 3287 /// \param QueryingValue Value trying to unify with SimplifiedValue 3288 /// \param AccumulatedSimplifiedValue Current simplification result. 3289 static bool checkAndUpdate(Attributor &A, const AbstractAttribute &QueryingAA, 3290 Value &QueryingValue, 3291 Optional<Value *> &AccumulatedSimplifiedValue) { 3292 // FIXME: Add a typecast support. 3293 3294 auto &ValueSimpifyAA = A.getAAFor<AAValueSimplify>( 3295 QueryingAA, IRPosition::value(QueryingValue)); 3296 3297 Optional<Value *> QueryingValueSimplified = 3298 ValueSimpifyAA.getAssumedSimplifiedValue(A); 3299 3300 if (!QueryingValueSimplified.hasValue()) 3301 return true; 3302 3303 if (!QueryingValueSimplified.getValue()) 3304 return false; 3305 3306 Value &QueryingValueSimplifiedUnwrapped = 3307 *QueryingValueSimplified.getValue(); 3308 3309 if (isa<UndefValue>(QueryingValueSimplifiedUnwrapped)) 3310 return true; 3311 3312 if (AccumulatedSimplifiedValue.hasValue()) 3313 return AccumulatedSimplifiedValue == QueryingValueSimplified; 3314 3315 LLVM_DEBUG(dbgs() << "[Attributor][ValueSimplify] " << QueryingValue 3316 << " is assumed to be " 3317 << QueryingValueSimplifiedUnwrapped << "\n"); 3318 3319 AccumulatedSimplifiedValue = QueryingValueSimplified; 3320 return true; 3321 } 3322 3323 /// See AbstractAttribute::manifest(...). 3324 ChangeStatus manifest(Attributor &A) override { 3325 ChangeStatus Changed = ChangeStatus::UNCHANGED; 3326 3327 if (!SimplifiedAssociatedValue.hasValue() || 3328 !SimplifiedAssociatedValue.getValue()) 3329 return Changed; 3330 3331 if (auto *C = dyn_cast<Constant>(SimplifiedAssociatedValue.getValue())) { 3332 // We can replace the AssociatedValue with the constant. 3333 Value &V = getAssociatedValue(); 3334 if (!V.user_empty() && &V != C && V.getType() == C->getType()) { 3335 LLVM_DEBUG(dbgs() << "[Attributor][ValueSimplify] " << V << " -> " << *C 3336 << "\n"); 3337 V.replaceAllUsesWith(C); 3338 Changed = ChangeStatus::CHANGED; 3339 } 3340 } 3341 3342 return Changed | AAValueSimplify::manifest(A); 3343 } 3344 3345 protected: 3346 // An assumed simplified value. Initially, it is set to Optional::None, which 3347 // means that the value is not clear under current assumption. If in the 3348 // pessimistic state, getAssumedSimplifiedValue doesn't return this value but 3349 // returns orignal associated value. 3350 Optional<Value *> SimplifiedAssociatedValue; 3351 }; 3352 3353 struct AAValueSimplifyArgument final : AAValueSimplifyImpl { 3354 AAValueSimplifyArgument(const IRPosition &IRP) : AAValueSimplifyImpl(IRP) {} 3355 3356 /// See AbstractAttribute::updateImpl(...). 3357 ChangeStatus updateImpl(Attributor &A) override { 3358 bool HasValueBefore = SimplifiedAssociatedValue.hasValue(); 3359 3360 auto PredForCallSite = [&](AbstractCallSite ACS) { 3361 // Check if we have an associated argument or not (which can happen for 3362 // callback calls). 3363 if (Value *ArgOp = ACS.getCallArgOperand(getArgNo())) 3364 return checkAndUpdate(A, *this, *ArgOp, SimplifiedAssociatedValue); 3365 return false; 3366 }; 3367 3368 if (!A.checkForAllCallSites(PredForCallSite, *this, true)) 3369 return indicatePessimisticFixpoint(); 3370 3371 // If a candicate was found in this update, return CHANGED. 3372 return HasValueBefore == SimplifiedAssociatedValue.hasValue() 3373 ? ChangeStatus::UNCHANGED 3374 : ChangeStatus ::CHANGED; 3375 } 3376 3377 /// See AbstractAttribute::trackStatistics() 3378 void trackStatistics() const override { 3379 STATS_DECLTRACK_ARG_ATTR(value_simplify) 3380 } 3381 }; 3382 3383 struct AAValueSimplifyReturned : AAValueSimplifyImpl { 3384 AAValueSimplifyReturned(const IRPosition &IRP) : AAValueSimplifyImpl(IRP) {} 3385 3386 /// See AbstractAttribute::updateImpl(...). 3387 ChangeStatus updateImpl(Attributor &A) override { 3388 bool HasValueBefore = SimplifiedAssociatedValue.hasValue(); 3389 3390 auto PredForReturned = [&](Value &V) { 3391 return checkAndUpdate(A, *this, V, SimplifiedAssociatedValue); 3392 }; 3393 3394 if (!A.checkForAllReturnedValues(PredForReturned, *this)) 3395 return indicatePessimisticFixpoint(); 3396 3397 // If a candicate was found in this update, return CHANGED. 3398 return HasValueBefore == SimplifiedAssociatedValue.hasValue() 3399 ? ChangeStatus::UNCHANGED 3400 : ChangeStatus ::CHANGED; 3401 } 3402 /// See AbstractAttribute::trackStatistics() 3403 void trackStatistics() const override { 3404 STATS_DECLTRACK_FNRET_ATTR(value_simplify) 3405 } 3406 }; 3407 3408 struct AAValueSimplifyFloating : AAValueSimplifyImpl { 3409 AAValueSimplifyFloating(const IRPosition &IRP) : AAValueSimplifyImpl(IRP) {} 3410 3411 /// See AbstractAttribute::initialize(...). 3412 void initialize(Attributor &A) override { 3413 Value &V = getAnchorValue(); 3414 3415 // TODO: add other stuffs 3416 if (isa<Constant>(V) || isa<UndefValue>(V)) 3417 indicatePessimisticFixpoint(); 3418 } 3419 3420 /// See AbstractAttribute::updateImpl(...). 3421 ChangeStatus updateImpl(Attributor &A) override { 3422 bool HasValueBefore = SimplifiedAssociatedValue.hasValue(); 3423 3424 auto VisitValueCB = [&](Value &V, BooleanState, bool Stripped) -> bool { 3425 auto &AA = A.getAAFor<AAValueSimplify>(*this, IRPosition::value(V)); 3426 if (!Stripped && this == &AA) { 3427 // TODO: Look the instruction and check recursively. 3428 LLVM_DEBUG( 3429 dbgs() << "[Attributor][ValueSimplify] Can't be stripped more : " 3430 << V << "\n"); 3431 indicatePessimisticFixpoint(); 3432 return false; 3433 } 3434 return checkAndUpdate(A, *this, V, SimplifiedAssociatedValue); 3435 }; 3436 3437 if (!genericValueTraversal<AAValueSimplify, BooleanState>( 3438 A, getIRPosition(), *this, static_cast<BooleanState &>(*this), 3439 VisitValueCB)) 3440 return indicatePessimisticFixpoint(); 3441 3442 // If a candicate was found in this update, return CHANGED. 3443 3444 return HasValueBefore == SimplifiedAssociatedValue.hasValue() 3445 ? ChangeStatus::UNCHANGED 3446 : ChangeStatus ::CHANGED; 3447 } 3448 3449 /// See AbstractAttribute::trackStatistics() 3450 void trackStatistics() const override { 3451 STATS_DECLTRACK_FLOATING_ATTR(value_simplify) 3452 } 3453 }; 3454 3455 struct AAValueSimplifyFunction : AAValueSimplifyImpl { 3456 AAValueSimplifyFunction(const IRPosition &IRP) : AAValueSimplifyImpl(IRP) {} 3457 3458 /// See AbstractAttribute::initialize(...). 3459 void initialize(Attributor &A) override { 3460 SimplifiedAssociatedValue = &getAnchorValue(); 3461 indicateOptimisticFixpoint(); 3462 } 3463 /// See AbstractAttribute::initialize(...). 3464 ChangeStatus updateImpl(Attributor &A) override { 3465 llvm_unreachable( 3466 "AAValueSimplify(Function|CallSite)::updateImpl will not be called"); 3467 } 3468 /// See AbstractAttribute::trackStatistics() 3469 void trackStatistics() const override { 3470 STATS_DECLTRACK_FN_ATTR(value_simplify) 3471 } 3472 }; 3473 3474 struct AAValueSimplifyCallSite : AAValueSimplifyFunction { 3475 AAValueSimplifyCallSite(const IRPosition &IRP) 3476 : AAValueSimplifyFunction(IRP) {} 3477 /// See AbstractAttribute::trackStatistics() 3478 void trackStatistics() const override { 3479 STATS_DECLTRACK_CS_ATTR(value_simplify) 3480 } 3481 }; 3482 3483 struct AAValueSimplifyCallSiteReturned : AAValueSimplifyReturned { 3484 AAValueSimplifyCallSiteReturned(const IRPosition &IRP) 3485 : AAValueSimplifyReturned(IRP) {} 3486 3487 void trackStatistics() const override { 3488 STATS_DECLTRACK_CSRET_ATTR(value_simplify) 3489 } 3490 }; 3491 struct AAValueSimplifyCallSiteArgument : AAValueSimplifyFloating { 3492 AAValueSimplifyCallSiteArgument(const IRPosition &IRP) 3493 : AAValueSimplifyFloating(IRP) {} 3494 3495 void trackStatistics() const override { 3496 STATS_DECLTRACK_CSARG_ATTR(value_simplify) 3497 } 3498 }; 3499 3500 /// ----------------------- Heap-To-Stack Conversion --------------------------- 3501 struct AAHeapToStackImpl : public AAHeapToStack { 3502 AAHeapToStackImpl(const IRPosition &IRP) : AAHeapToStack(IRP) {} 3503 3504 const std::string getAsStr() const override { 3505 return "[H2S] Mallocs: " + std::to_string(MallocCalls.size()); 3506 } 3507 3508 ChangeStatus manifest(Attributor &A) override { 3509 assert(getState().isValidState() && 3510 "Attempted to manifest an invalid state!"); 3511 3512 ChangeStatus HasChanged = ChangeStatus::UNCHANGED; 3513 Function *F = getAssociatedFunction(); 3514 const auto *TLI = A.getInfoCache().getTargetLibraryInfoForFunction(*F); 3515 3516 for (Instruction *MallocCall : MallocCalls) { 3517 // This malloc cannot be replaced. 3518 if (BadMallocCalls.count(MallocCall)) 3519 continue; 3520 3521 for (Instruction *FreeCall : FreesForMalloc[MallocCall]) { 3522 LLVM_DEBUG(dbgs() << "H2S: Removing free call: " << *FreeCall << "\n"); 3523 A.deleteAfterManifest(*FreeCall); 3524 HasChanged = ChangeStatus::CHANGED; 3525 } 3526 3527 LLVM_DEBUG(dbgs() << "H2S: Removing malloc call: " << *MallocCall 3528 << "\n"); 3529 3530 Constant *Size; 3531 if (isCallocLikeFn(MallocCall, TLI)) { 3532 auto *Num = cast<ConstantInt>(MallocCall->getOperand(0)); 3533 auto *SizeT = dyn_cast<ConstantInt>(MallocCall->getOperand(1)); 3534 APInt TotalSize = SizeT->getValue() * Num->getValue(); 3535 Size = 3536 ConstantInt::get(MallocCall->getOperand(0)->getType(), TotalSize); 3537 } else { 3538 Size = cast<ConstantInt>(MallocCall->getOperand(0)); 3539 } 3540 3541 unsigned AS = cast<PointerType>(MallocCall->getType())->getAddressSpace(); 3542 Instruction *AI = new AllocaInst(Type::getInt8Ty(F->getContext()), AS, 3543 Size, "", MallocCall->getNextNode()); 3544 3545 if (AI->getType() != MallocCall->getType()) 3546 AI = new BitCastInst(AI, MallocCall->getType(), "malloc_bc", 3547 AI->getNextNode()); 3548 3549 MallocCall->replaceAllUsesWith(AI); 3550 3551 if (auto *II = dyn_cast<InvokeInst>(MallocCall)) { 3552 auto *NBB = II->getNormalDest(); 3553 BranchInst::Create(NBB, MallocCall->getParent()); 3554 A.deleteAfterManifest(*MallocCall); 3555 } else { 3556 A.deleteAfterManifest(*MallocCall); 3557 } 3558 3559 if (isCallocLikeFn(MallocCall, TLI)) { 3560 auto *BI = new BitCastInst(AI, MallocCall->getType(), "calloc_bc", 3561 AI->getNextNode()); 3562 Value *Ops[] = { 3563 BI, ConstantInt::get(F->getContext(), APInt(8, 0, false)), Size, 3564 ConstantInt::get(Type::getInt1Ty(F->getContext()), false)}; 3565 3566 Type *Tys[] = {BI->getType(), MallocCall->getOperand(0)->getType()}; 3567 Module *M = F->getParent(); 3568 Function *Fn = Intrinsic::getDeclaration(M, Intrinsic::memset, Tys); 3569 CallInst::Create(Fn, Ops, "", BI->getNextNode()); 3570 } 3571 HasChanged = ChangeStatus::CHANGED; 3572 } 3573 3574 return HasChanged; 3575 } 3576 3577 /// Collection of all malloc calls in a function. 3578 SmallSetVector<Instruction *, 4> MallocCalls; 3579 3580 /// Collection of malloc calls that cannot be converted. 3581 DenseSet<const Instruction *> BadMallocCalls; 3582 3583 /// A map for each malloc call to the set of associated free calls. 3584 DenseMap<Instruction *, SmallPtrSet<Instruction *, 4>> FreesForMalloc; 3585 3586 ChangeStatus updateImpl(Attributor &A) override; 3587 }; 3588 3589 ChangeStatus AAHeapToStackImpl::updateImpl(Attributor &A) { 3590 const Function *F = getAssociatedFunction(); 3591 const auto *TLI = A.getInfoCache().getTargetLibraryInfoForFunction(*F); 3592 3593 auto UsesCheck = [&](Instruction &I) { 3594 SmallPtrSet<const Use *, 8> Visited; 3595 SmallVector<const Use *, 8> Worklist; 3596 3597 for (Use &U : I.uses()) 3598 Worklist.push_back(&U); 3599 3600 while (!Worklist.empty()) { 3601 const Use *U = Worklist.pop_back_val(); 3602 if (!Visited.insert(U).second) 3603 continue; 3604 3605 auto *UserI = U->getUser(); 3606 3607 if (isa<LoadInst>(UserI)) 3608 continue; 3609 if (auto *SI = dyn_cast<StoreInst>(UserI)) { 3610 if (SI->getValueOperand() == U->get()) { 3611 LLVM_DEBUG(dbgs() << "[H2S] escaping store to memory: " << *UserI << "\n"); 3612 return false; 3613 } 3614 // A store into the malloc'ed memory is fine. 3615 continue; 3616 } 3617 3618 // NOTE: Right now, if a function that has malloc pointer as an argument 3619 // frees memory, we assume that the malloc pointer is freed. 3620 3621 // TODO: Add nofree callsite argument attribute to indicate that pointer 3622 // argument is not freed. 3623 if (auto *CB = dyn_cast<CallBase>(UserI)) { 3624 if (!CB->isArgOperand(U)) 3625 continue; 3626 3627 if (CB->isLifetimeStartOrEnd()) 3628 continue; 3629 3630 // Record malloc. 3631 if (isFreeCall(UserI, TLI)) { 3632 FreesForMalloc[&I].insert( 3633 cast<Instruction>(const_cast<User *>(UserI))); 3634 continue; 3635 } 3636 3637 // If a function does not free memory we are fine 3638 const auto &NoFreeAA = 3639 A.getAAFor<AANoFree>(*this, IRPosition::callsite_function(*CB)); 3640 3641 unsigned ArgNo = U - CB->arg_begin(); 3642 const auto &NoCaptureAA = A.getAAFor<AANoCapture>( 3643 *this, IRPosition::callsite_argument(*CB, ArgNo)); 3644 3645 if (!NoCaptureAA.isAssumedNoCapture() || !NoFreeAA.isAssumedNoFree()) { 3646 LLVM_DEBUG(dbgs() << "[H2S] Bad user: " << *UserI << "\n"); 3647 return false; 3648 } 3649 continue; 3650 } 3651 3652 if (isa<GetElementPtrInst>(UserI) || isa<BitCastInst>(UserI)) { 3653 for (Use &U : UserI->uses()) 3654 Worklist.push_back(&U); 3655 continue; 3656 } 3657 3658 // Unknown user. 3659 LLVM_DEBUG(dbgs() << "[H2S] Unknown user: " << *UserI << "\n"); 3660 return false; 3661 } 3662 return true; 3663 }; 3664 3665 auto MallocCallocCheck = [&](Instruction &I) { 3666 if (BadMallocCalls.count(&I)) 3667 return true; 3668 3669 bool IsMalloc = isMallocLikeFn(&I, TLI); 3670 bool IsCalloc = !IsMalloc && isCallocLikeFn(&I, TLI); 3671 if (!IsMalloc && !IsCalloc) { 3672 BadMallocCalls.insert(&I); 3673 return true; 3674 } 3675 3676 if (IsMalloc) { 3677 if (auto *Size = dyn_cast<ConstantInt>(I.getOperand(0))) 3678 if (Size->getValue().sle(MaxHeapToStackSize)) 3679 if (UsesCheck(I)) { 3680 MallocCalls.insert(&I); 3681 return true; 3682 } 3683 } else if (IsCalloc) { 3684 bool Overflow = false; 3685 if (auto *Num = dyn_cast<ConstantInt>(I.getOperand(0))) 3686 if (auto *Size = dyn_cast<ConstantInt>(I.getOperand(1))) 3687 if ((Size->getValue().umul_ov(Num->getValue(), Overflow)) 3688 .sle(MaxHeapToStackSize)) 3689 if (!Overflow && UsesCheck(I)) { 3690 MallocCalls.insert(&I); 3691 return true; 3692 } 3693 } 3694 3695 BadMallocCalls.insert(&I); 3696 return true; 3697 }; 3698 3699 size_t NumBadMallocs = BadMallocCalls.size(); 3700 3701 A.checkForAllCallLikeInstructions(MallocCallocCheck, *this); 3702 3703 if (NumBadMallocs != BadMallocCalls.size()) 3704 return ChangeStatus::CHANGED; 3705 3706 return ChangeStatus::UNCHANGED; 3707 } 3708 3709 struct AAHeapToStackFunction final : public AAHeapToStackImpl { 3710 AAHeapToStackFunction(const IRPosition &IRP) : AAHeapToStackImpl(IRP) {} 3711 3712 /// See AbstractAttribute::trackStatistics() 3713 void trackStatistics() const override { 3714 STATS_DECL(MallocCalls, Function, 3715 "Number of MallocCalls converted to allocas"); 3716 BUILD_STAT_NAME(MallocCalls, Function) += MallocCalls.size(); 3717 } 3718 }; 3719 3720 /// -------------------- Memory Behavior Attributes ---------------------------- 3721 /// Includes read-none, read-only, and write-only. 3722 /// ---------------------------------------------------------------------------- 3723 struct AAMemoryBehaviorImpl : public AAMemoryBehavior { 3724 AAMemoryBehaviorImpl(const IRPosition &IRP) : AAMemoryBehavior(IRP) {} 3725 3726 /// See AbstractAttribute::initialize(...). 3727 void initialize(Attributor &A) override { 3728 intersectAssumedBits(BEST_STATE); 3729 getKnownStateFromValue(getIRPosition(), getState()); 3730 IRAttribute::initialize(A); 3731 } 3732 3733 /// Return the memory behavior information encoded in the IR for \p IRP. 3734 static void getKnownStateFromValue(const IRPosition &IRP, 3735 IntegerState &State) { 3736 SmallVector<Attribute, 2> Attrs; 3737 IRP.getAttrs(AttrKinds, Attrs); 3738 for (const Attribute &Attr : Attrs) { 3739 switch (Attr.getKindAsEnum()) { 3740 case Attribute::ReadNone: 3741 State.addKnownBits(NO_ACCESSES); 3742 break; 3743 case Attribute::ReadOnly: 3744 State.addKnownBits(NO_WRITES); 3745 break; 3746 case Attribute::WriteOnly: 3747 State.addKnownBits(NO_READS); 3748 break; 3749 default: 3750 llvm_unreachable("Unexpcted attribute!"); 3751 } 3752 } 3753 3754 if (auto *I = dyn_cast<Instruction>(&IRP.getAnchorValue())) { 3755 if (!I->mayReadFromMemory()) 3756 State.addKnownBits(NO_READS); 3757 if (!I->mayWriteToMemory()) 3758 State.addKnownBits(NO_WRITES); 3759 } 3760 } 3761 3762 /// See AbstractAttribute::getDeducedAttributes(...). 3763 void getDeducedAttributes(LLVMContext &Ctx, 3764 SmallVectorImpl<Attribute> &Attrs) const override { 3765 assert(Attrs.size() == 0); 3766 if (isAssumedReadNone()) 3767 Attrs.push_back(Attribute::get(Ctx, Attribute::ReadNone)); 3768 else if (isAssumedReadOnly()) 3769 Attrs.push_back(Attribute::get(Ctx, Attribute::ReadOnly)); 3770 else if (isAssumedWriteOnly()) 3771 Attrs.push_back(Attribute::get(Ctx, Attribute::WriteOnly)); 3772 assert(Attrs.size() <= 1); 3773 } 3774 3775 /// See AbstractAttribute::manifest(...). 3776 ChangeStatus manifest(Attributor &A) override { 3777 IRPosition &IRP = getIRPosition(); 3778 3779 // Check if we would improve the existing attributes first. 3780 SmallVector<Attribute, 4> DeducedAttrs; 3781 getDeducedAttributes(IRP.getAnchorValue().getContext(), DeducedAttrs); 3782 if (llvm::all_of(DeducedAttrs, [&](const Attribute &Attr) { 3783 return IRP.hasAttr(Attr.getKindAsEnum(), 3784 /* IgnoreSubsumingPositions */ true); 3785 })) 3786 return ChangeStatus::UNCHANGED; 3787 3788 // Clear existing attributes. 3789 IRP.removeAttrs(AttrKinds); 3790 3791 // Use the generic manifest method. 3792 return IRAttribute::manifest(A); 3793 } 3794 3795 /// See AbstractState::getAsStr(). 3796 const std::string getAsStr() const override { 3797 if (isAssumedReadNone()) 3798 return "readnone"; 3799 if (isAssumedReadOnly()) 3800 return "readonly"; 3801 if (isAssumedWriteOnly()) 3802 return "writeonly"; 3803 return "may-read/write"; 3804 } 3805 3806 /// The set of IR attributes AAMemoryBehavior deals with. 3807 static const Attribute::AttrKind AttrKinds[3]; 3808 }; 3809 3810 const Attribute::AttrKind AAMemoryBehaviorImpl::AttrKinds[] = { 3811 Attribute::ReadNone, Attribute::ReadOnly, Attribute::WriteOnly}; 3812 3813 /// Memory behavior attribute for a floating value. 3814 struct AAMemoryBehaviorFloating : AAMemoryBehaviorImpl { 3815 AAMemoryBehaviorFloating(const IRPosition &IRP) : AAMemoryBehaviorImpl(IRP) {} 3816 3817 /// See AbstractAttribute::initialize(...). 3818 void initialize(Attributor &A) override { 3819 AAMemoryBehaviorImpl::initialize(A); 3820 // Initialize the use vector with all direct uses of the associated value. 3821 for (const Use &U : getAssociatedValue().uses()) 3822 Uses.insert(&U); 3823 } 3824 3825 /// See AbstractAttribute::updateImpl(...). 3826 ChangeStatus updateImpl(Attributor &A) override; 3827 3828 /// See AbstractAttribute::trackStatistics() 3829 void trackStatistics() const override { 3830 if (isAssumedReadNone()) 3831 STATS_DECLTRACK_FLOATING_ATTR(readnone) 3832 else if (isAssumedReadOnly()) 3833 STATS_DECLTRACK_FLOATING_ATTR(readonly) 3834 else if (isAssumedWriteOnly()) 3835 STATS_DECLTRACK_FLOATING_ATTR(writeonly) 3836 } 3837 3838 private: 3839 /// Return true if users of \p UserI might access the underlying 3840 /// variable/location described by \p U and should therefore be analyzed. 3841 bool followUsersOfUseIn(Attributor &A, const Use *U, 3842 const Instruction *UserI); 3843 3844 /// Update the state according to the effect of use \p U in \p UserI. 3845 void analyzeUseIn(Attributor &A, const Use *U, const Instruction *UserI); 3846 3847 protected: 3848 /// Container for (transitive) uses of the associated argument. 3849 SetVector<const Use *> Uses; 3850 }; 3851 3852 /// Memory behavior attribute for function argument. 3853 struct AAMemoryBehaviorArgument : AAMemoryBehaviorFloating { 3854 AAMemoryBehaviorArgument(const IRPosition &IRP) 3855 : AAMemoryBehaviorFloating(IRP) {} 3856 3857 /// See AbstractAttribute::initialize(...). 3858 void initialize(Attributor &A) override { 3859 AAMemoryBehaviorFloating::initialize(A); 3860 3861 // Initialize the use vector with all direct uses of the associated value. 3862 Argument *Arg = getAssociatedArgument(); 3863 if (!Arg || !Arg->getParent()->hasExactDefinition()) 3864 indicatePessimisticFixpoint(); 3865 } 3866 3867 ChangeStatus manifest(Attributor &A) override { 3868 // TODO: From readattrs.ll: "inalloca parameters are always 3869 // considered written" 3870 if (hasAttr({Attribute::InAlloca})) { 3871 removeKnownBits(NO_WRITES); 3872 removeAssumedBits(NO_WRITES); 3873 } 3874 return AAMemoryBehaviorFloating::manifest(A); 3875 } 3876 3877 3878 /// See AbstractAttribute::trackStatistics() 3879 void trackStatistics() const override { 3880 if (isAssumedReadNone()) 3881 STATS_DECLTRACK_ARG_ATTR(readnone) 3882 else if (isAssumedReadOnly()) 3883 STATS_DECLTRACK_ARG_ATTR(readonly) 3884 else if (isAssumedWriteOnly()) 3885 STATS_DECLTRACK_ARG_ATTR(writeonly) 3886 } 3887 }; 3888 3889 struct AAMemoryBehaviorCallSiteArgument final : AAMemoryBehaviorArgument { 3890 AAMemoryBehaviorCallSiteArgument(const IRPosition &IRP) 3891 : AAMemoryBehaviorArgument(IRP) {} 3892 3893 /// See AbstractAttribute::updateImpl(...). 3894 ChangeStatus updateImpl(Attributor &A) override { 3895 // TODO: Once we have call site specific value information we can provide 3896 // call site specific liveness liveness information and then it makes 3897 // sense to specialize attributes for call sites arguments instead of 3898 // redirecting requests to the callee argument. 3899 Argument *Arg = getAssociatedArgument(); 3900 const IRPosition &ArgPos = IRPosition::argument(*Arg); 3901 auto &ArgAA = A.getAAFor<AAMemoryBehavior>(*this, ArgPos); 3902 return clampStateAndIndicateChange( 3903 getState(), 3904 static_cast<const AANoCapture::StateType &>(ArgAA.getState())); 3905 } 3906 3907 /// See AbstractAttribute::trackStatistics() 3908 void trackStatistics() const override { 3909 if (isAssumedReadNone()) 3910 STATS_DECLTRACK_CSARG_ATTR(readnone) 3911 else if (isAssumedReadOnly()) 3912 STATS_DECLTRACK_CSARG_ATTR(readonly) 3913 else if (isAssumedWriteOnly()) 3914 STATS_DECLTRACK_CSARG_ATTR(writeonly) 3915 } 3916 }; 3917 3918 /// Memory behavior attribute for a call site return position. 3919 struct AAMemoryBehaviorCallSiteReturned final : AAMemoryBehaviorFloating { 3920 AAMemoryBehaviorCallSiteReturned(const IRPosition &IRP) 3921 : AAMemoryBehaviorFloating(IRP) {} 3922 3923 /// See AbstractAttribute::manifest(...). 3924 ChangeStatus manifest(Attributor &A) override { 3925 // We do not annotate returned values. 3926 return ChangeStatus::UNCHANGED; 3927 } 3928 3929 /// See AbstractAttribute::trackStatistics() 3930 void trackStatistics() const override {} 3931 }; 3932 3933 /// An AA to represent the memory behavior function attributes. 3934 struct AAMemoryBehaviorFunction final : public AAMemoryBehaviorImpl { 3935 AAMemoryBehaviorFunction(const IRPosition &IRP) : AAMemoryBehaviorImpl(IRP) {} 3936 3937 /// See AbstractAttribute::updateImpl(Attributor &A). 3938 virtual ChangeStatus updateImpl(Attributor &A) override; 3939 3940 /// See AbstractAttribute::manifest(...). 3941 ChangeStatus manifest(Attributor &A) override { 3942 Function &F = cast<Function>(getAnchorValue()); 3943 if (isAssumedReadNone()) { 3944 F.removeFnAttr(Attribute::ArgMemOnly); 3945 F.removeFnAttr(Attribute::InaccessibleMemOnly); 3946 F.removeFnAttr(Attribute::InaccessibleMemOrArgMemOnly); 3947 } 3948 return AAMemoryBehaviorImpl::manifest(A); 3949 } 3950 3951 /// See AbstractAttribute::trackStatistics() 3952 void trackStatistics() const override { 3953 if (isAssumedReadNone()) 3954 STATS_DECLTRACK_FN_ATTR(readnone) 3955 else if (isAssumedReadOnly()) 3956 STATS_DECLTRACK_FN_ATTR(readonly) 3957 else if (isAssumedWriteOnly()) 3958 STATS_DECLTRACK_FN_ATTR(writeonly) 3959 } 3960 }; 3961 3962 /// AAMemoryBehavior attribute for call sites. 3963 struct AAMemoryBehaviorCallSite final : AAMemoryBehaviorImpl { 3964 AAMemoryBehaviorCallSite(const IRPosition &IRP) : AAMemoryBehaviorImpl(IRP) {} 3965 3966 /// See AbstractAttribute::initialize(...). 3967 void initialize(Attributor &A) override { 3968 AAMemoryBehaviorImpl::initialize(A); 3969 Function *F = getAssociatedFunction(); 3970 if (!F || !F->hasExactDefinition()) 3971 indicatePessimisticFixpoint(); 3972 } 3973 3974 /// See AbstractAttribute::updateImpl(...). 3975 ChangeStatus updateImpl(Attributor &A) override { 3976 // TODO: Once we have call site specific value information we can provide 3977 // call site specific liveness liveness information and then it makes 3978 // sense to specialize attributes for call sites arguments instead of 3979 // redirecting requests to the callee argument. 3980 Function *F = getAssociatedFunction(); 3981 const IRPosition &FnPos = IRPosition::function(*F); 3982 auto &FnAA = A.getAAFor<AAMemoryBehavior>(*this, FnPos); 3983 return clampStateAndIndicateChange( 3984 getState(), static_cast<const AAAlign::StateType &>(FnAA.getState())); 3985 } 3986 3987 /// See AbstractAttribute::trackStatistics() 3988 void trackStatistics() const override { 3989 if (isAssumedReadNone()) 3990 STATS_DECLTRACK_CS_ATTR(readnone) 3991 else if (isAssumedReadOnly()) 3992 STATS_DECLTRACK_CS_ATTR(readonly) 3993 else if (isAssumedWriteOnly()) 3994 STATS_DECLTRACK_CS_ATTR(writeonly) 3995 } 3996 }; 3997 } // namespace 3998 3999 ChangeStatus AAMemoryBehaviorFunction::updateImpl(Attributor &A) { 4000 4001 // The current assumed state used to determine a change. 4002 auto AssumedState = getAssumed(); 4003 4004 auto CheckRWInst = [&](Instruction &I) { 4005 // If the instruction has an own memory behavior state, use it to restrict 4006 // the local state. No further analysis is required as the other memory 4007 // state is as optimistic as it gets. 4008 if (ImmutableCallSite ICS = ImmutableCallSite(&I)) { 4009 const auto &MemBehaviorAA = A.getAAFor<AAMemoryBehavior>( 4010 *this, IRPosition::callsite_function(ICS)); 4011 intersectAssumedBits(MemBehaviorAA.getAssumed()); 4012 return !isAtFixpoint(); 4013 } 4014 4015 // Remove access kind modifiers if necessary. 4016 if (I.mayReadFromMemory()) 4017 removeAssumedBits(NO_READS); 4018 if (I.mayWriteToMemory()) 4019 removeAssumedBits(NO_WRITES); 4020 return !isAtFixpoint(); 4021 }; 4022 4023 if (!A.checkForAllReadWriteInstructions(CheckRWInst, *this)) 4024 return indicatePessimisticFixpoint(); 4025 4026 return (AssumedState != getAssumed()) ? ChangeStatus::CHANGED 4027 : ChangeStatus::UNCHANGED; 4028 } 4029 4030 ChangeStatus AAMemoryBehaviorFloating::updateImpl(Attributor &A) { 4031 4032 const IRPosition &IRP = getIRPosition(); 4033 const IRPosition &FnPos = IRPosition::function_scope(IRP); 4034 AAMemoryBehavior::StateType &S = getState(); 4035 4036 // First, check the function scope. We take the known information and we avoid 4037 // work if the assumed information implies the current assumed information for 4038 // this attribute. 4039 const auto &FnMemAA = A.getAAFor<AAMemoryBehavior>(*this, FnPos); 4040 S.addKnownBits(FnMemAA.getKnown()); 4041 if ((S.getAssumed() & FnMemAA.getAssumed()) == S.getAssumed()) 4042 return ChangeStatus::UNCHANGED; 4043 4044 // Make sure the value is not captured (except through "return"), if 4045 // it is, any information derived would be irrelevant anyway as we cannot 4046 // check the potential aliases introduced by the capture. However, no need 4047 // to fall back to anythign less optimistic than the function state. 4048 const auto &ArgNoCaptureAA = A.getAAFor<AANoCapture>(*this, IRP); 4049 if (!ArgNoCaptureAA.isAssumedNoCaptureMaybeReturned()) { 4050 S.intersectAssumedBits(FnMemAA.getAssumed()); 4051 return ChangeStatus::CHANGED; 4052 } 4053 4054 // The current assumed state used to determine a change. 4055 auto AssumedState = S.getAssumed(); 4056 4057 // Liveness information to exclude dead users. 4058 // TODO: Take the FnPos once we have call site specific liveness information. 4059 const auto &LivenessAA = A.getAAFor<AAIsDead>( 4060 *this, IRPosition::function(*IRP.getAssociatedFunction())); 4061 4062 // Visit and expand uses until all are analyzed or a fixpoint is reached. 4063 for (unsigned i = 0; i < Uses.size() && !isAtFixpoint(); i++) { 4064 const Use *U = Uses[i]; 4065 Instruction *UserI = cast<Instruction>(U->getUser()); 4066 LLVM_DEBUG(dbgs() << "[AAMemoryBehavior] Use: " << **U << " in " << *UserI 4067 << " [Dead: " << (LivenessAA.isAssumedDead(UserI)) 4068 << "]\n"); 4069 if (LivenessAA.isAssumedDead(UserI)) 4070 continue; 4071 4072 // Check if the users of UserI should also be visited. 4073 if (followUsersOfUseIn(A, U, UserI)) 4074 for (const Use &UserIUse : UserI->uses()) 4075 Uses.insert(&UserIUse); 4076 4077 // If UserI might touch memory we analyze the use in detail. 4078 if (UserI->mayReadOrWriteMemory()) 4079 analyzeUseIn(A, U, UserI); 4080 } 4081 4082 return (AssumedState != getAssumed()) ? ChangeStatus::CHANGED 4083 : ChangeStatus::UNCHANGED; 4084 } 4085 4086 bool AAMemoryBehaviorFloating::followUsersOfUseIn(Attributor &A, const Use *U, 4087 const Instruction *UserI) { 4088 // The loaded value is unrelated to the pointer argument, no need to 4089 // follow the users of the load. 4090 if (isa<LoadInst>(UserI)) 4091 return false; 4092 4093 // By default we follow all uses assuming UserI might leak information on U, 4094 // we have special handling for call sites operands though. 4095 ImmutableCallSite ICS(UserI); 4096 if (!ICS || !ICS.isArgOperand(U)) 4097 return true; 4098 4099 // If the use is a call argument known not to be captured, the users of 4100 // the call do not need to be visited because they have to be unrelated to 4101 // the input. Note that this check is not trivial even though we disallow 4102 // general capturing of the underlying argument. The reason is that the 4103 // call might the argument "through return", which we allow and for which we 4104 // need to check call users. 4105 unsigned ArgNo = ICS.getArgumentNo(U); 4106 const auto &ArgNoCaptureAA = 4107 A.getAAFor<AANoCapture>(*this, IRPosition::callsite_argument(ICS, ArgNo)); 4108 return !ArgNoCaptureAA.isAssumedNoCapture(); 4109 } 4110 4111 void AAMemoryBehaviorFloating::analyzeUseIn(Attributor &A, const Use *U, 4112 const Instruction *UserI) { 4113 assert(UserI->mayReadOrWriteMemory()); 4114 4115 switch (UserI->getOpcode()) { 4116 default: 4117 // TODO: Handle all atomics and other side-effect operations we know of. 4118 break; 4119 case Instruction::Load: 4120 // Loads cause the NO_READS property to disappear. 4121 removeAssumedBits(NO_READS); 4122 return; 4123 4124 case Instruction::Store: 4125 // Stores cause the NO_WRITES property to disappear if the use is the 4126 // pointer operand. Note that we do assume that capturing was taken care of 4127 // somewhere else. 4128 if (cast<StoreInst>(UserI)->getPointerOperand() == U->get()) 4129 removeAssumedBits(NO_WRITES); 4130 return; 4131 4132 case Instruction::Call: 4133 case Instruction::CallBr: 4134 case Instruction::Invoke: { 4135 // For call sites we look at the argument memory behavior attribute (this 4136 // could be recursive!) in order to restrict our own state. 4137 ImmutableCallSite ICS(UserI); 4138 4139 // Give up on operand bundles. 4140 if (ICS.isBundleOperand(U)) { 4141 indicatePessimisticFixpoint(); 4142 return; 4143 } 4144 4145 // Calling a function does read the function pointer, maybe write it if the 4146 // function is self-modifying. 4147 if (ICS.isCallee(U)) { 4148 removeAssumedBits(NO_READS); 4149 break; 4150 } 4151 4152 // Adjust the possible access behavior based on the information on the 4153 // argument. 4154 unsigned ArgNo = ICS.getArgumentNo(U); 4155 const IRPosition &ArgPos = IRPosition::callsite_argument(ICS, ArgNo); 4156 const auto &MemBehaviorAA = A.getAAFor<AAMemoryBehavior>(*this, ArgPos); 4157 // "assumed" has at most the same bits as the MemBehaviorAA assumed 4158 // and at least "known". 4159 intersectAssumedBits(MemBehaviorAA.getAssumed()); 4160 return; 4161 } 4162 }; 4163 4164 // Generally, look at the "may-properties" and adjust the assumed state if we 4165 // did not trigger special handling before. 4166 if (UserI->mayReadFromMemory()) 4167 removeAssumedBits(NO_READS); 4168 if (UserI->mayWriteToMemory()) 4169 removeAssumedBits(NO_WRITES); 4170 } 4171 4172 /// ---------------------------------------------------------------------------- 4173 /// Attributor 4174 /// ---------------------------------------------------------------------------- 4175 4176 bool Attributor::isAssumedDead(const AbstractAttribute &AA, 4177 const AAIsDead *LivenessAA) { 4178 const Instruction *CtxI = AA.getIRPosition().getCtxI(); 4179 if (!CtxI) 4180 return false; 4181 4182 if (!LivenessAA) 4183 LivenessAA = 4184 &getAAFor<AAIsDead>(AA, IRPosition::function(*CtxI->getFunction()), 4185 /* TrackDependence */ false); 4186 4187 // Don't check liveness for AAIsDead. 4188 if (&AA == LivenessAA) 4189 return false; 4190 4191 if (!LivenessAA->isAssumedDead(CtxI)) 4192 return false; 4193 4194 // We actually used liveness information so we have to record a dependence. 4195 recordDependence(*LivenessAA, AA); 4196 4197 return true; 4198 } 4199 4200 bool Attributor::checkForAllCallSites( 4201 const function_ref<bool(AbstractCallSite)> &Pred, 4202 const AbstractAttribute &QueryingAA, bool RequireAllCallSites) { 4203 // We can try to determine information from 4204 // the call sites. However, this is only possible all call sites are known, 4205 // hence the function has internal linkage. 4206 const IRPosition &IRP = QueryingAA.getIRPosition(); 4207 const Function *AssociatedFunction = IRP.getAssociatedFunction(); 4208 if (!AssociatedFunction) { 4209 LLVM_DEBUG(dbgs() << "[Attributor] No function associated with " << IRP 4210 << "\n"); 4211 return false; 4212 } 4213 4214 return checkForAllCallSites(Pred, *AssociatedFunction, RequireAllCallSites, 4215 &QueryingAA); 4216 } 4217 4218 bool Attributor::checkForAllCallSites( 4219 const function_ref<bool(AbstractCallSite)> &Pred, const Function &Fn, 4220 bool RequireAllCallSites, const AbstractAttribute *QueryingAA) { 4221 if (RequireAllCallSites && !Fn.hasLocalLinkage()) { 4222 LLVM_DEBUG( 4223 dbgs() 4224 << "[Attributor] Function " << Fn.getName() 4225 << " has no internal linkage, hence not all call sites are known\n"); 4226 return false; 4227 } 4228 4229 for (const Use &U : Fn.uses()) { 4230 AbstractCallSite ACS(&U); 4231 if (!ACS) { 4232 LLVM_DEBUG(dbgs() << "[Attributor] Function " 4233 << Fn.getName() 4234 << " has non call site use " << *U.get() << " in " 4235 << *U.getUser() << "\n"); 4236 return false; 4237 } 4238 4239 Instruction *I = ACS.getInstruction(); 4240 Function *Caller = I->getFunction(); 4241 4242 const auto *LivenessAA = 4243 lookupAAFor<AAIsDead>(IRPosition::function(*Caller), QueryingAA, 4244 /* TrackDependence */ false); 4245 4246 // Skip dead calls. 4247 if (LivenessAA && LivenessAA->isAssumedDead(I)) { 4248 // We actually used liveness information so we have to record a 4249 // dependence. 4250 if (QueryingAA) 4251 recordDependence(*LivenessAA, *QueryingAA); 4252 continue; 4253 } 4254 4255 const Use *EffectiveUse = 4256 ACS.isCallbackCall() ? &ACS.getCalleeUseForCallback() : &U; 4257 if (!ACS.isCallee(EffectiveUse)) { 4258 if (!RequireAllCallSites) 4259 continue; 4260 LLVM_DEBUG(dbgs() << "[Attributor] User " << EffectiveUse->getUser() 4261 << " is an invalid use of " 4262 << Fn.getName() << "\n"); 4263 return false; 4264 } 4265 4266 if (Pred(ACS)) 4267 continue; 4268 4269 LLVM_DEBUG(dbgs() << "[Attributor] Call site callback failed for " 4270 << *ACS.getInstruction() << "\n"); 4271 return false; 4272 } 4273 4274 return true; 4275 } 4276 4277 bool Attributor::checkForAllReturnedValuesAndReturnInsts( 4278 const function_ref<bool(Value &, const SmallSetVector<ReturnInst *, 4> &)> 4279 &Pred, 4280 const AbstractAttribute &QueryingAA) { 4281 4282 const IRPosition &IRP = QueryingAA.getIRPosition(); 4283 // Since we need to provide return instructions we have to have an exact 4284 // definition. 4285 const Function *AssociatedFunction = IRP.getAssociatedFunction(); 4286 if (!AssociatedFunction) 4287 return false; 4288 4289 // If this is a call site query we use the call site specific return values 4290 // and liveness information. 4291 // TODO: use the function scope once we have call site AAReturnedValues. 4292 const IRPosition &QueryIRP = IRPosition::function(*AssociatedFunction); 4293 const auto &AARetVal = getAAFor<AAReturnedValues>(QueryingAA, QueryIRP); 4294 if (!AARetVal.getState().isValidState()) 4295 return false; 4296 4297 return AARetVal.checkForAllReturnedValuesAndReturnInsts(Pred); 4298 } 4299 4300 bool Attributor::checkForAllReturnedValues( 4301 const function_ref<bool(Value &)> &Pred, 4302 const AbstractAttribute &QueryingAA) { 4303 4304 const IRPosition &IRP = QueryingAA.getIRPosition(); 4305 const Function *AssociatedFunction = IRP.getAssociatedFunction(); 4306 if (!AssociatedFunction) 4307 return false; 4308 4309 // TODO: use the function scope once we have call site AAReturnedValues. 4310 const IRPosition &QueryIRP = IRPosition::function(*AssociatedFunction); 4311 const auto &AARetVal = getAAFor<AAReturnedValues>(QueryingAA, QueryIRP); 4312 if (!AARetVal.getState().isValidState()) 4313 return false; 4314 4315 return AARetVal.checkForAllReturnedValuesAndReturnInsts( 4316 [&](Value &RV, const SmallSetVector<ReturnInst *, 4> &) { 4317 return Pred(RV); 4318 }); 4319 } 4320 4321 static bool 4322 checkForAllInstructionsImpl(InformationCache::OpcodeInstMapTy &OpcodeInstMap, 4323 const function_ref<bool(Instruction &)> &Pred, 4324 const AAIsDead *LivenessAA, bool &AnyDead, 4325 const ArrayRef<unsigned> &Opcodes) { 4326 for (unsigned Opcode : Opcodes) { 4327 for (Instruction *I : OpcodeInstMap[Opcode]) { 4328 // Skip dead instructions. 4329 if (LivenessAA && LivenessAA->isAssumedDead(I)) { 4330 AnyDead = true; 4331 continue; 4332 } 4333 4334 if (!Pred(*I)) 4335 return false; 4336 } 4337 } 4338 return true; 4339 } 4340 4341 bool Attributor::checkForAllInstructions( 4342 const llvm::function_ref<bool(Instruction &)> &Pred, 4343 const AbstractAttribute &QueryingAA, const ArrayRef<unsigned> &Opcodes) { 4344 4345 const IRPosition &IRP = QueryingAA.getIRPosition(); 4346 // Since we need to provide instructions we have to have an exact definition. 4347 const Function *AssociatedFunction = IRP.getAssociatedFunction(); 4348 if (!AssociatedFunction) 4349 return false; 4350 4351 // TODO: use the function scope once we have call site AAReturnedValues. 4352 const IRPosition &QueryIRP = IRPosition::function(*AssociatedFunction); 4353 const auto &LivenessAA = 4354 getAAFor<AAIsDead>(QueryingAA, QueryIRP, /* TrackDependence */ false); 4355 bool AnyDead = false; 4356 4357 auto &OpcodeInstMap = 4358 InfoCache.getOpcodeInstMapForFunction(*AssociatedFunction); 4359 if (!checkForAllInstructionsImpl(OpcodeInstMap, Pred, &LivenessAA, AnyDead, 4360 Opcodes)) 4361 return false; 4362 4363 // If we actually used liveness information so we have to record a dependence. 4364 if (AnyDead) 4365 recordDependence(LivenessAA, QueryingAA); 4366 4367 return true; 4368 } 4369 4370 bool Attributor::checkForAllReadWriteInstructions( 4371 const llvm::function_ref<bool(Instruction &)> &Pred, 4372 AbstractAttribute &QueryingAA) { 4373 4374 const Function *AssociatedFunction = 4375 QueryingAA.getIRPosition().getAssociatedFunction(); 4376 if (!AssociatedFunction) 4377 return false; 4378 4379 // TODO: use the function scope once we have call site AAReturnedValues. 4380 const IRPosition &QueryIRP = IRPosition::function(*AssociatedFunction); 4381 const auto &LivenessAA = 4382 getAAFor<AAIsDead>(QueryingAA, QueryIRP, /* TrackDependence */ false); 4383 bool AnyDead = false; 4384 4385 for (Instruction *I : 4386 InfoCache.getReadOrWriteInstsForFunction(*AssociatedFunction)) { 4387 // Skip dead instructions. 4388 if (LivenessAA.isAssumedDead(I)) { 4389 AnyDead = true; 4390 continue; 4391 } 4392 4393 if (!Pred(*I)) 4394 return false; 4395 } 4396 4397 // If we actually used liveness information so we have to record a dependence. 4398 if (AnyDead) 4399 recordDependence(LivenessAA, QueryingAA); 4400 4401 return true; 4402 } 4403 4404 ChangeStatus Attributor::run(Module &M) { 4405 LLVM_DEBUG(dbgs() << "[Attributor] Identified and initialized " 4406 << AllAbstractAttributes.size() 4407 << " abstract attributes.\n"); 4408 4409 // Now that all abstract attributes are collected and initialized we start 4410 // the abstract analysis. 4411 4412 unsigned IterationCounter = 1; 4413 4414 SmallVector<AbstractAttribute *, 64> ChangedAAs; 4415 SetVector<AbstractAttribute *> Worklist; 4416 Worklist.insert(AllAbstractAttributes.begin(), AllAbstractAttributes.end()); 4417 4418 bool RecomputeDependences = false; 4419 4420 do { 4421 // Remember the size to determine new attributes. 4422 size_t NumAAs = AllAbstractAttributes.size(); 4423 LLVM_DEBUG(dbgs() << "\n\n[Attributor] #Iteration: " << IterationCounter 4424 << ", Worklist size: " << Worklist.size() << "\n"); 4425 4426 // If dependences (=QueryMap) are recomputed we have to look at all abstract 4427 // attributes again, regardless of what changed in the last iteration. 4428 if (RecomputeDependences) { 4429 LLVM_DEBUG( 4430 dbgs() << "[Attributor] Run all AAs to recompute dependences\n"); 4431 QueryMap.clear(); 4432 ChangedAAs.clear(); 4433 Worklist.insert(AllAbstractAttributes.begin(), 4434 AllAbstractAttributes.end()); 4435 } 4436 4437 // Add all abstract attributes that are potentially dependent on one that 4438 // changed to the work list. 4439 for (AbstractAttribute *ChangedAA : ChangedAAs) { 4440 auto &QuerriedAAs = QueryMap[ChangedAA]; 4441 Worklist.insert(QuerriedAAs.begin(), QuerriedAAs.end()); 4442 } 4443 4444 LLVM_DEBUG(dbgs() << "[Attributor] #Iteration: " << IterationCounter 4445 << ", Worklist+Dependent size: " << Worklist.size() 4446 << "\n"); 4447 4448 // Reset the changed set. 4449 ChangedAAs.clear(); 4450 4451 // Update all abstract attribute in the work list and record the ones that 4452 // changed. 4453 for (AbstractAttribute *AA : Worklist) 4454 if (!isAssumedDead(*AA, nullptr)) 4455 if (AA->update(*this) == ChangeStatus::CHANGED) 4456 ChangedAAs.push_back(AA); 4457 4458 // Check if we recompute the dependences in the next iteration. 4459 RecomputeDependences = (DepRecomputeInterval > 0 && 4460 IterationCounter % DepRecomputeInterval == 0); 4461 4462 // Add attributes to the changed set if they have been created in the last 4463 // iteration. 4464 ChangedAAs.append(AllAbstractAttributes.begin() + NumAAs, 4465 AllAbstractAttributes.end()); 4466 4467 // Reset the work list and repopulate with the changed abstract attributes. 4468 // Note that dependent ones are added above. 4469 Worklist.clear(); 4470 Worklist.insert(ChangedAAs.begin(), ChangedAAs.end()); 4471 4472 } while (!Worklist.empty() && (IterationCounter++ < MaxFixpointIterations || 4473 VerifyMaxFixpointIterations)); 4474 4475 LLVM_DEBUG(dbgs() << "\n[Attributor] Fixpoint iteration done after: " 4476 << IterationCounter << "/" << MaxFixpointIterations 4477 << " iterations\n"); 4478 4479 size_t NumFinalAAs = AllAbstractAttributes.size(); 4480 4481 // Reset abstract arguments not settled in a sound fixpoint by now. This 4482 // happens when we stopped the fixpoint iteration early. Note that only the 4483 // ones marked as "changed" *and* the ones transitively depending on them 4484 // need to be reverted to a pessimistic state. Others might not be in a 4485 // fixpoint state but we can use the optimistic results for them anyway. 4486 SmallPtrSet<AbstractAttribute *, 32> Visited; 4487 for (unsigned u = 0; u < ChangedAAs.size(); u++) { 4488 AbstractAttribute *ChangedAA = ChangedAAs[u]; 4489 if (!Visited.insert(ChangedAA).second) 4490 continue; 4491 4492 AbstractState &State = ChangedAA->getState(); 4493 if (!State.isAtFixpoint()) { 4494 State.indicatePessimisticFixpoint(); 4495 4496 NumAttributesTimedOut++; 4497 } 4498 4499 auto &QuerriedAAs = QueryMap[ChangedAA]; 4500 ChangedAAs.append(QuerriedAAs.begin(), QuerriedAAs.end()); 4501 } 4502 4503 LLVM_DEBUG({ 4504 if (!Visited.empty()) 4505 dbgs() << "\n[Attributor] Finalized " << Visited.size() 4506 << " abstract attributes.\n"; 4507 }); 4508 4509 unsigned NumManifested = 0; 4510 unsigned NumAtFixpoint = 0; 4511 ChangeStatus ManifestChange = ChangeStatus::UNCHANGED; 4512 for (AbstractAttribute *AA : AllAbstractAttributes) { 4513 AbstractState &State = AA->getState(); 4514 4515 // If there is not already a fixpoint reached, we can now take the 4516 // optimistic state. This is correct because we enforced a pessimistic one 4517 // on abstract attributes that were transitively dependent on a changed one 4518 // already above. 4519 if (!State.isAtFixpoint()) 4520 State.indicateOptimisticFixpoint(); 4521 4522 // If the state is invalid, we do not try to manifest it. 4523 if (!State.isValidState()) 4524 continue; 4525 4526 // Skip dead code. 4527 if (isAssumedDead(*AA, nullptr)) 4528 continue; 4529 // Manifest the state and record if we changed the IR. 4530 ChangeStatus LocalChange = AA->manifest(*this); 4531 if (LocalChange == ChangeStatus::CHANGED && AreStatisticsEnabled()) 4532 AA->trackStatistics(); 4533 4534 ManifestChange = ManifestChange | LocalChange; 4535 4536 NumAtFixpoint++; 4537 NumManifested += (LocalChange == ChangeStatus::CHANGED); 4538 } 4539 4540 (void)NumManifested; 4541 (void)NumAtFixpoint; 4542 LLVM_DEBUG(dbgs() << "\n[Attributor] Manifested " << NumManifested 4543 << " arguments while " << NumAtFixpoint 4544 << " were in a valid fixpoint state\n"); 4545 4546 NumAttributesManifested += NumManifested; 4547 NumAttributesValidFixpoint += NumAtFixpoint; 4548 4549 (void)NumFinalAAs; 4550 assert( 4551 NumFinalAAs == AllAbstractAttributes.size() && 4552 "Expected the final number of abstract attributes to remain unchanged!"); 4553 4554 // Delete stuff at the end to avoid invalid references and a nice order. 4555 { 4556 LLVM_DEBUG(dbgs() << "\n[Attributor] Delete at least " 4557 << ToBeDeletedFunctions.size() << " functions and " 4558 << ToBeDeletedBlocks.size() << " blocks and " 4559 << ToBeDeletedInsts.size() << " instructions\n"); 4560 for (Instruction *I : ToBeDeletedInsts) { 4561 if (!I->use_empty()) 4562 I->replaceAllUsesWith(UndefValue::get(I->getType())); 4563 I->eraseFromParent(); 4564 } 4565 4566 if (unsigned NumDeadBlocks = ToBeDeletedBlocks.size()) { 4567 SmallVector<BasicBlock *, 8> ToBeDeletedBBs; 4568 ToBeDeletedBBs.reserve(NumDeadBlocks); 4569 ToBeDeletedBBs.append(ToBeDeletedBlocks.begin(), ToBeDeletedBlocks.end()); 4570 DeleteDeadBlocks(ToBeDeletedBBs); 4571 STATS_DECLTRACK(AAIsDead, BasicBlock, 4572 "Number of dead basic blocks deleted."); 4573 } 4574 4575 STATS_DECL(AAIsDead, Function, "Number of dead functions deleted."); 4576 for (Function *Fn : ToBeDeletedFunctions) { 4577 Fn->replaceAllUsesWith(UndefValue::get(Fn->getType())); 4578 Fn->eraseFromParent(); 4579 STATS_TRACK(AAIsDead, Function); 4580 } 4581 4582 // Identify dead internal functions and delete them. This happens outside 4583 // the other fixpoint analysis as we might treat potentially dead functions 4584 // as live to lower the number of iterations. If they happen to be dead, the 4585 // below fixpoint loop will identify and eliminate them. 4586 SmallVector<Function *, 8> InternalFns; 4587 for (Function &F : M) 4588 if (F.hasLocalLinkage()) 4589 InternalFns.push_back(&F); 4590 4591 bool FoundDeadFn = true; 4592 while (FoundDeadFn) { 4593 FoundDeadFn = false; 4594 for (unsigned u = 0, e = InternalFns.size(); u < e; ++u) { 4595 Function *F = InternalFns[u]; 4596 if (!F) 4597 continue; 4598 4599 const auto *LivenessAA = 4600 lookupAAFor<AAIsDead>(IRPosition::function(*F)); 4601 if (LivenessAA && 4602 !checkForAllCallSites([](AbstractCallSite ACS) { return false; }, 4603 *LivenessAA, true)) 4604 continue; 4605 4606 STATS_TRACK(AAIsDead, Function); 4607 F->replaceAllUsesWith(UndefValue::get(F->getType())); 4608 F->eraseFromParent(); 4609 InternalFns[u] = nullptr; 4610 FoundDeadFn = true; 4611 } 4612 } 4613 } 4614 4615 if (VerifyMaxFixpointIterations && 4616 IterationCounter != MaxFixpointIterations) { 4617 errs() << "\n[Attributor] Fixpoint iteration done after: " 4618 << IterationCounter << "/" << MaxFixpointIterations 4619 << " iterations\n"; 4620 llvm_unreachable("The fixpoint was not reached with exactly the number of " 4621 "specified iterations!"); 4622 } 4623 4624 return ManifestChange; 4625 } 4626 4627 void Attributor::initializeInformationCache(Function &F) { 4628 4629 // Walk all instructions to find interesting instructions that might be 4630 // queried by abstract attributes during their initialization or update. 4631 // This has to happen before we create attributes. 4632 auto &ReadOrWriteInsts = InfoCache.FuncRWInstsMap[&F]; 4633 auto &InstOpcodeMap = InfoCache.FuncInstOpcodeMap[&F]; 4634 4635 for (Instruction &I : instructions(&F)) { 4636 bool IsInterestingOpcode = false; 4637 4638 // To allow easy access to all instructions in a function with a given 4639 // opcode we store them in the InfoCache. As not all opcodes are interesting 4640 // to concrete attributes we only cache the ones that are as identified in 4641 // the following switch. 4642 // Note: There are no concrete attributes now so this is initially empty. 4643 switch (I.getOpcode()) { 4644 default: 4645 assert((!ImmutableCallSite(&I)) && (!isa<CallBase>(&I)) && 4646 "New call site/base instruction type needs to be known int the " 4647 "Attributor."); 4648 break; 4649 case Instruction::Load: 4650 // The alignment of a pointer is interesting for loads. 4651 case Instruction::Store: 4652 // The alignment of a pointer is interesting for stores. 4653 case Instruction::Call: 4654 case Instruction::CallBr: 4655 case Instruction::Invoke: 4656 case Instruction::CleanupRet: 4657 case Instruction::CatchSwitch: 4658 case Instruction::Resume: 4659 case Instruction::Ret: 4660 IsInterestingOpcode = true; 4661 } 4662 if (IsInterestingOpcode) 4663 InstOpcodeMap[I.getOpcode()].push_back(&I); 4664 if (I.mayReadOrWriteMemory()) 4665 ReadOrWriteInsts.push_back(&I); 4666 } 4667 } 4668 4669 void Attributor::identifyDefaultAbstractAttributes(Function &F) { 4670 if (!VisitedFunctions.insert(&F).second) 4671 return; 4672 4673 IRPosition FPos = IRPosition::function(F); 4674 4675 // Check for dead BasicBlocks in every function. 4676 // We need dead instruction detection because we do not want to deal with 4677 // broken IR in which SSA rules do not apply. 4678 getOrCreateAAFor<AAIsDead>(FPos); 4679 4680 // Every function might be "will-return". 4681 getOrCreateAAFor<AAWillReturn>(FPos); 4682 4683 // Every function can be nounwind. 4684 getOrCreateAAFor<AANoUnwind>(FPos); 4685 4686 // Every function might be marked "nosync" 4687 getOrCreateAAFor<AANoSync>(FPos); 4688 4689 // Every function might be "no-free". 4690 getOrCreateAAFor<AANoFree>(FPos); 4691 4692 // Every function might be "no-return". 4693 getOrCreateAAFor<AANoReturn>(FPos); 4694 4695 // Every function might be "no-recurse". 4696 getOrCreateAAFor<AANoRecurse>(FPos); 4697 4698 // Every function might be "readnone/readonly/writeonly/...". 4699 getOrCreateAAFor<AAMemoryBehavior>(FPos); 4700 4701 // Every function might be applicable for Heap-To-Stack conversion. 4702 if (EnableHeapToStack) 4703 getOrCreateAAFor<AAHeapToStack>(FPos); 4704 4705 // Return attributes are only appropriate if the return type is non void. 4706 Type *ReturnType = F.getReturnType(); 4707 if (!ReturnType->isVoidTy()) { 4708 // Argument attribute "returned" --- Create only one per function even 4709 // though it is an argument attribute. 4710 getOrCreateAAFor<AAReturnedValues>(FPos); 4711 4712 IRPosition RetPos = IRPosition::returned(F); 4713 4714 // Every function might be simplified. 4715 getOrCreateAAFor<AAValueSimplify>(RetPos); 4716 4717 if (ReturnType->isPointerTy()) { 4718 4719 // Every function with pointer return type might be marked align. 4720 getOrCreateAAFor<AAAlign>(RetPos); 4721 4722 // Every function with pointer return type might be marked nonnull. 4723 getOrCreateAAFor<AANonNull>(RetPos); 4724 4725 // Every function with pointer return type might be marked noalias. 4726 getOrCreateAAFor<AANoAlias>(RetPos); 4727 4728 // Every function with pointer return type might be marked 4729 // dereferenceable. 4730 getOrCreateAAFor<AADereferenceable>(RetPos); 4731 } 4732 } 4733 4734 for (Argument &Arg : F.args()) { 4735 IRPosition ArgPos = IRPosition::argument(Arg); 4736 4737 // Every argument might be simplified. 4738 getOrCreateAAFor<AAValueSimplify>(ArgPos); 4739 4740 if (Arg.getType()->isPointerTy()) { 4741 // Every argument with pointer type might be marked nonnull. 4742 getOrCreateAAFor<AANonNull>(ArgPos); 4743 4744 // Every argument with pointer type might be marked noalias. 4745 getOrCreateAAFor<AANoAlias>(ArgPos); 4746 4747 // Every argument with pointer type might be marked dereferenceable. 4748 getOrCreateAAFor<AADereferenceable>(ArgPos); 4749 4750 // Every argument with pointer type might be marked align. 4751 getOrCreateAAFor<AAAlign>(ArgPos); 4752 4753 // Every argument with pointer type might be marked nocapture. 4754 getOrCreateAAFor<AANoCapture>(ArgPos); 4755 4756 // Every argument with pointer type might be marked 4757 // "readnone/readonly/writeonly/..." 4758 getOrCreateAAFor<AAMemoryBehavior>(ArgPos); 4759 } 4760 } 4761 4762 auto CallSitePred = [&](Instruction &I) -> bool { 4763 CallSite CS(&I); 4764 if (CS.getCalledFunction()) { 4765 for (int i = 0, e = CS.getCalledFunction()->arg_size(); i < e; i++) { 4766 4767 IRPosition CSArgPos = IRPosition::callsite_argument(CS, i); 4768 4769 // Call site argument might be simplified. 4770 getOrCreateAAFor<AAValueSimplify>(CSArgPos); 4771 4772 if (!CS.getArgument(i)->getType()->isPointerTy()) 4773 continue; 4774 4775 // Call site argument attribute "non-null". 4776 getOrCreateAAFor<AANonNull>(CSArgPos); 4777 4778 // Call site argument attribute "no-alias". 4779 getOrCreateAAFor<AANoAlias>(CSArgPos); 4780 4781 // Call site argument attribute "dereferenceable". 4782 getOrCreateAAFor<AADereferenceable>(CSArgPos); 4783 4784 // Call site argument attribute "align". 4785 getOrCreateAAFor<AAAlign>(CSArgPos); 4786 } 4787 } 4788 return true; 4789 }; 4790 4791 auto &OpcodeInstMap = InfoCache.getOpcodeInstMapForFunction(F); 4792 bool Success, AnyDead = false; 4793 Success = checkForAllInstructionsImpl( 4794 OpcodeInstMap, CallSitePred, nullptr, AnyDead, 4795 {(unsigned)Instruction::Invoke, (unsigned)Instruction::CallBr, 4796 (unsigned)Instruction::Call}); 4797 (void)Success; 4798 assert(Success && !AnyDead && "Expected the check call to be successful!"); 4799 4800 auto LoadStorePred = [&](Instruction &I) -> bool { 4801 if (isa<LoadInst>(I)) 4802 getOrCreateAAFor<AAAlign>( 4803 IRPosition::value(*cast<LoadInst>(I).getPointerOperand())); 4804 else 4805 getOrCreateAAFor<AAAlign>( 4806 IRPosition::value(*cast<StoreInst>(I).getPointerOperand())); 4807 return true; 4808 }; 4809 Success = checkForAllInstructionsImpl( 4810 OpcodeInstMap, LoadStorePred, nullptr, AnyDead, 4811 {(unsigned)Instruction::Load, (unsigned)Instruction::Store}); 4812 (void)Success; 4813 assert(Success && !AnyDead && "Expected the check call to be successful!"); 4814 } 4815 4816 /// Helpers to ease debugging through output streams and print calls. 4817 /// 4818 ///{ 4819 raw_ostream &llvm::operator<<(raw_ostream &OS, ChangeStatus S) { 4820 return OS << (S == ChangeStatus::CHANGED ? "changed" : "unchanged"); 4821 } 4822 4823 raw_ostream &llvm::operator<<(raw_ostream &OS, IRPosition::Kind AP) { 4824 switch (AP) { 4825 case IRPosition::IRP_INVALID: 4826 return OS << "inv"; 4827 case IRPosition::IRP_FLOAT: 4828 return OS << "flt"; 4829 case IRPosition::IRP_RETURNED: 4830 return OS << "fn_ret"; 4831 case IRPosition::IRP_CALL_SITE_RETURNED: 4832 return OS << "cs_ret"; 4833 case IRPosition::IRP_FUNCTION: 4834 return OS << "fn"; 4835 case IRPosition::IRP_CALL_SITE: 4836 return OS << "cs"; 4837 case IRPosition::IRP_ARGUMENT: 4838 return OS << "arg"; 4839 case IRPosition::IRP_CALL_SITE_ARGUMENT: 4840 return OS << "cs_arg"; 4841 } 4842 llvm_unreachable("Unknown attribute position!"); 4843 } 4844 4845 raw_ostream &llvm::operator<<(raw_ostream &OS, const IRPosition &Pos) { 4846 const Value &AV = Pos.getAssociatedValue(); 4847 return OS << "{" << Pos.getPositionKind() << ":" << AV.getName() << " [" 4848 << Pos.getAnchorValue().getName() << "@" << Pos.getArgNo() << "]}"; 4849 } 4850 4851 raw_ostream &llvm::operator<<(raw_ostream &OS, const IntegerState &S) { 4852 return OS << "(" << S.getKnown() << "-" << S.getAssumed() << ")" 4853 << static_cast<const AbstractState &>(S); 4854 } 4855 4856 raw_ostream &llvm::operator<<(raw_ostream &OS, const AbstractState &S) { 4857 return OS << (!S.isValidState() ? "top" : (S.isAtFixpoint() ? "fix" : "")); 4858 } 4859 4860 raw_ostream &llvm::operator<<(raw_ostream &OS, const AbstractAttribute &AA) { 4861 AA.print(OS); 4862 return OS; 4863 } 4864 4865 void AbstractAttribute::print(raw_ostream &OS) const { 4866 OS << "[P: " << getIRPosition() << "][" << getAsStr() << "][S: " << getState() 4867 << "]"; 4868 } 4869 ///} 4870 4871 /// ---------------------------------------------------------------------------- 4872 /// Pass (Manager) Boilerplate 4873 /// ---------------------------------------------------------------------------- 4874 4875 static bool runAttributorOnModule(Module &M, AnalysisGetter &AG) { 4876 if (DisableAttributor) 4877 return false; 4878 4879 LLVM_DEBUG(dbgs() << "[Attributor] Run on module with " << M.size() 4880 << " functions.\n"); 4881 4882 // Create an Attributor and initially empty information cache that is filled 4883 // while we identify default attribute opportunities. 4884 InformationCache InfoCache(M, AG); 4885 Attributor A(InfoCache, DepRecInterval); 4886 4887 for (Function &F : M) 4888 A.initializeInformationCache(F); 4889 4890 for (Function &F : M) { 4891 if (F.hasExactDefinition()) 4892 NumFnWithExactDefinition++; 4893 else 4894 NumFnWithoutExactDefinition++; 4895 4896 // We look at internal functions only on-demand but if any use is not a 4897 // direct call, we have to do it eagerly. 4898 if (F.hasLocalLinkage()) { 4899 if (llvm::all_of(F.uses(), [](const Use &U) { 4900 return ImmutableCallSite(U.getUser()) && 4901 ImmutableCallSite(U.getUser()).isCallee(&U); 4902 })) 4903 continue; 4904 } 4905 4906 // Populate the Attributor with abstract attribute opportunities in the 4907 // function and the information cache with IR information. 4908 A.identifyDefaultAbstractAttributes(F); 4909 } 4910 4911 return A.run(M) == ChangeStatus::CHANGED; 4912 } 4913 4914 PreservedAnalyses AttributorPass::run(Module &M, ModuleAnalysisManager &AM) { 4915 AnalysisGetter AG(AM); 4916 if (runAttributorOnModule(M, AG)) { 4917 // FIXME: Think about passes we will preserve and add them here. 4918 return PreservedAnalyses::none(); 4919 } 4920 return PreservedAnalyses::all(); 4921 } 4922 4923 namespace { 4924 4925 struct AttributorLegacyPass : public ModulePass { 4926 static char ID; 4927 4928 AttributorLegacyPass() : ModulePass(ID) { 4929 initializeAttributorLegacyPassPass(*PassRegistry::getPassRegistry()); 4930 } 4931 4932 bool runOnModule(Module &M) override { 4933 if (skipModule(M)) 4934 return false; 4935 4936 AnalysisGetter AG; 4937 return runAttributorOnModule(M, AG); 4938 } 4939 4940 void getAnalysisUsage(AnalysisUsage &AU) const override { 4941 // FIXME: Think about passes we will preserve and add them here. 4942 AU.addRequired<TargetLibraryInfoWrapperPass>(); 4943 } 4944 }; 4945 4946 } // end anonymous namespace 4947 4948 Pass *llvm::createAttributorLegacyPass() { return new AttributorLegacyPass(); } 4949 4950 char AttributorLegacyPass::ID = 0; 4951 4952 const char AAReturnedValues::ID = 0; 4953 const char AANoUnwind::ID = 0; 4954 const char AANoSync::ID = 0; 4955 const char AANoFree::ID = 0; 4956 const char AANonNull::ID = 0; 4957 const char AANoRecurse::ID = 0; 4958 const char AAWillReturn::ID = 0; 4959 const char AANoAlias::ID = 0; 4960 const char AANoReturn::ID = 0; 4961 const char AAIsDead::ID = 0; 4962 const char AADereferenceable::ID = 0; 4963 const char AAAlign::ID = 0; 4964 const char AANoCapture::ID = 0; 4965 const char AAValueSimplify::ID = 0; 4966 const char AAHeapToStack::ID = 0; 4967 const char AAMemoryBehavior::ID = 0; 4968 4969 // Macro magic to create the static generator function for attributes that 4970 // follow the naming scheme. 4971 4972 #define SWITCH_PK_INV(CLASS, PK, POS_NAME) \ 4973 case IRPosition::PK: \ 4974 llvm_unreachable("Cannot create " #CLASS " for a " POS_NAME " position!"); 4975 4976 #define SWITCH_PK_CREATE(CLASS, IRP, PK, SUFFIX) \ 4977 case IRPosition::PK: \ 4978 AA = new CLASS##SUFFIX(IRP); \ 4979 break; 4980 4981 #define CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(CLASS) \ 4982 CLASS &CLASS::createForPosition(const IRPosition &IRP, Attributor &A) { \ 4983 CLASS *AA = nullptr; \ 4984 switch (IRP.getPositionKind()) { \ 4985 SWITCH_PK_INV(CLASS, IRP_INVALID, "invalid") \ 4986 SWITCH_PK_INV(CLASS, IRP_FLOAT, "floating") \ 4987 SWITCH_PK_INV(CLASS, IRP_ARGUMENT, "argument") \ 4988 SWITCH_PK_INV(CLASS, IRP_RETURNED, "returned") \ 4989 SWITCH_PK_INV(CLASS, IRP_CALL_SITE_RETURNED, "call site returned") \ 4990 SWITCH_PK_INV(CLASS, IRP_CALL_SITE_ARGUMENT, "call site argument") \ 4991 SWITCH_PK_CREATE(CLASS, IRP, IRP_FUNCTION, Function) \ 4992 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE, CallSite) \ 4993 } \ 4994 return *AA; \ 4995 } 4996 4997 #define CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION(CLASS) \ 4998 CLASS &CLASS::createForPosition(const IRPosition &IRP, Attributor &A) { \ 4999 CLASS *AA = nullptr; \ 5000 switch (IRP.getPositionKind()) { \ 5001 SWITCH_PK_INV(CLASS, IRP_INVALID, "invalid") \ 5002 SWITCH_PK_INV(CLASS, IRP_FUNCTION, "function") \ 5003 SWITCH_PK_INV(CLASS, IRP_CALL_SITE, "call site") \ 5004 SWITCH_PK_CREATE(CLASS, IRP, IRP_FLOAT, Floating) \ 5005 SWITCH_PK_CREATE(CLASS, IRP, IRP_ARGUMENT, Argument) \ 5006 SWITCH_PK_CREATE(CLASS, IRP, IRP_RETURNED, Returned) \ 5007 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE_RETURNED, CallSiteReturned) \ 5008 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE_ARGUMENT, CallSiteArgument) \ 5009 } \ 5010 return *AA; \ 5011 } 5012 5013 #define CREATE_ALL_ABSTRACT_ATTRIBUTE_FOR_POSITION(CLASS) \ 5014 CLASS &CLASS::createForPosition(const IRPosition &IRP, Attributor &A) { \ 5015 CLASS *AA = nullptr; \ 5016 switch (IRP.getPositionKind()) { \ 5017 SWITCH_PK_INV(CLASS, IRP_INVALID, "invalid") \ 5018 SWITCH_PK_CREATE(CLASS, IRP, IRP_FUNCTION, Function) \ 5019 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE, CallSite) \ 5020 SWITCH_PK_CREATE(CLASS, IRP, IRP_FLOAT, Floating) \ 5021 SWITCH_PK_CREATE(CLASS, IRP, IRP_ARGUMENT, Argument) \ 5022 SWITCH_PK_CREATE(CLASS, IRP, IRP_RETURNED, Returned) \ 5023 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE_RETURNED, CallSiteReturned) \ 5024 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE_ARGUMENT, CallSiteArgument) \ 5025 } \ 5026 return *AA; \ 5027 } 5028 5029 #define CREATE_FUNCTION_ONLY_ABSTRACT_ATTRIBUTE_FOR_POSITION(CLASS) \ 5030 CLASS &CLASS::createForPosition(const IRPosition &IRP, Attributor &A) { \ 5031 CLASS *AA = nullptr; \ 5032 switch (IRP.getPositionKind()) { \ 5033 SWITCH_PK_INV(CLASS, IRP_INVALID, "invalid") \ 5034 SWITCH_PK_INV(CLASS, IRP_ARGUMENT, "argument") \ 5035 SWITCH_PK_INV(CLASS, IRP_FLOAT, "floating") \ 5036 SWITCH_PK_INV(CLASS, IRP_RETURNED, "returned") \ 5037 SWITCH_PK_INV(CLASS, IRP_CALL_SITE_RETURNED, "call site returned") \ 5038 SWITCH_PK_INV(CLASS, IRP_CALL_SITE_ARGUMENT, "call site argument") \ 5039 SWITCH_PK_INV(CLASS, IRP_CALL_SITE, "call site") \ 5040 SWITCH_PK_CREATE(CLASS, IRP, IRP_FUNCTION, Function) \ 5041 } \ 5042 return *AA; \ 5043 } 5044 5045 #define CREATE_NON_RET_ABSTRACT_ATTRIBUTE_FOR_POSITION(CLASS) \ 5046 CLASS &CLASS::createForPosition(const IRPosition &IRP, Attributor &A) { \ 5047 CLASS *AA = nullptr; \ 5048 switch (IRP.getPositionKind()) { \ 5049 SWITCH_PK_INV(CLASS, IRP_INVALID, "invalid") \ 5050 SWITCH_PK_INV(CLASS, IRP_RETURNED, "returned") \ 5051 SWITCH_PK_CREATE(CLASS, IRP, IRP_FUNCTION, Function) \ 5052 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE, CallSite) \ 5053 SWITCH_PK_CREATE(CLASS, IRP, IRP_FLOAT, Floating) \ 5054 SWITCH_PK_CREATE(CLASS, IRP, IRP_ARGUMENT, Argument) \ 5055 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE_RETURNED, CallSiteReturned) \ 5056 SWITCH_PK_CREATE(CLASS, IRP, IRP_CALL_SITE_ARGUMENT, CallSiteArgument) \ 5057 } \ 5058 return *AA; \ 5059 } 5060 5061 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoUnwind) 5062 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoSync) 5063 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoFree) 5064 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoRecurse) 5065 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAWillReturn) 5066 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoReturn) 5067 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAIsDead) 5068 CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAReturnedValues) 5069 5070 CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANonNull) 5071 CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoAlias) 5072 CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION(AADereferenceable) 5073 CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAAlign) 5074 CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION(AANoCapture) 5075 5076 CREATE_ALL_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAValueSimplify) 5077 5078 CREATE_FUNCTION_ONLY_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAHeapToStack) 5079 5080 CREATE_NON_RET_ABSTRACT_ATTRIBUTE_FOR_POSITION(AAMemoryBehavior) 5081 5082 #undef CREATE_FUNCTION_ONLY_ABSTRACT_ATTRIBUTE_FOR_POSITION 5083 #undef CREATE_FUNCTION_ABSTRACT_ATTRIBUTE_FOR_POSITION 5084 #undef CREATE_NON_RET_ABSTRACT_ATTRIBUTE_FOR_POSITION 5085 #undef CREATE_VALUE_ABSTRACT_ATTRIBUTE_FOR_POSITION 5086 #undef CREATE_ALL_ABSTRACT_ATTRIBUTE_FOR_POSITION 5087 #undef SWITCH_PK_CREATE 5088 #undef SWITCH_PK_INV 5089 5090 INITIALIZE_PASS_BEGIN(AttributorLegacyPass, "attributor", 5091 "Deduce and propagate attributes", false, false) 5092 INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass) 5093 INITIALIZE_PASS_END(AttributorLegacyPass, "attributor", 5094 "Deduce and propagate attributes", false, false) 5095