1 //===--- CGExprAgg.cpp - Emit LLVM Code from Aggregate Expressions --------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This contains code to emit Aggregate Expr nodes as LLVM code.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "CodeGenFunction.h"
15 #include "CodeGenModule.h"
16 #include "CGObjCRuntime.h"
17 #include "clang/AST/ASTContext.h"
18 #include "clang/AST/DeclCXX.h"
19 #include "clang/AST/StmtVisitor.h"
20 #include "llvm/Constants.h"
21 #include "llvm/Function.h"
22 #include "llvm/GlobalVariable.h"
23 #include "llvm/Intrinsics.h"
24 using namespace clang;
25 using namespace CodeGen;
26 
27 //===----------------------------------------------------------------------===//
28 //                        Aggregate Expression Emitter
29 //===----------------------------------------------------------------------===//
30 
31 namespace  {
32 class AggExprEmitter : public StmtVisitor<AggExprEmitter> {
33   CodeGenFunction &CGF;
34   CGBuilderTy &Builder;
35   AggValueSlot Dest;
36   bool IgnoreResult;
37 
38   /// We want to use 'dest' as the return slot except under two
39   /// conditions:
40   ///   - The destination slot requires garbage collection, so we
41   ///     need to use the GC API.
42   ///   - The destination slot is potentially aliased.
43   bool shouldUseDestForReturnSlot() const {
44     return !(Dest.requiresGCollection() || Dest.isPotentiallyAliased());
45   }
46 
47   ReturnValueSlot getReturnValueSlot() const {
48     if (!shouldUseDestForReturnSlot())
49       return ReturnValueSlot();
50 
51     return ReturnValueSlot(Dest.getAddr(), Dest.isVolatile());
52   }
53 
54   AggValueSlot EnsureSlot(QualType T) {
55     if (!Dest.isIgnored()) return Dest;
56     return CGF.CreateAggTemp(T, "agg.tmp.ensured");
57   }
58 
59 public:
60   AggExprEmitter(CodeGenFunction &cgf, AggValueSlot Dest,
61                  bool ignore)
62     : CGF(cgf), Builder(CGF.Builder), Dest(Dest),
63       IgnoreResult(ignore) {
64   }
65 
66   //===--------------------------------------------------------------------===//
67   //                               Utilities
68   //===--------------------------------------------------------------------===//
69 
70   /// EmitAggLoadOfLValue - Given an expression with aggregate type that
71   /// represents a value lvalue, this method emits the address of the lvalue,
72   /// then loads the result into DestPtr.
73   void EmitAggLoadOfLValue(const Expr *E);
74 
75   /// EmitFinalDestCopy - Perform the final copy to DestPtr, if desired.
76   void EmitFinalDestCopy(const Expr *E, LValue Src, bool Ignore = false);
77   void EmitFinalDestCopy(const Expr *E, RValue Src, bool Ignore = false);
78 
79   void EmitMoveFromReturnSlot(const Expr *E, RValue Src);
80 
81   AggValueSlot::NeedsGCBarriers_t needsGC(QualType T) {
82     if (CGF.getLangOptions().getGCMode() && TypeRequiresGCollection(T))
83       return AggValueSlot::NeedsGCBarriers;
84     return AggValueSlot::DoesNotNeedGCBarriers;
85   }
86 
87   bool TypeRequiresGCollection(QualType T);
88 
89   //===--------------------------------------------------------------------===//
90   //                            Visitor Methods
91   //===--------------------------------------------------------------------===//
92 
93   void VisitStmt(Stmt *S) {
94     CGF.ErrorUnsupported(S, "aggregate expression");
95   }
96   void VisitParenExpr(ParenExpr *PE) { Visit(PE->getSubExpr()); }
97   void VisitGenericSelectionExpr(GenericSelectionExpr *GE) {
98     Visit(GE->getResultExpr());
99   }
100   void VisitUnaryExtension(UnaryOperator *E) { Visit(E->getSubExpr()); }
101   void VisitSubstNonTypeTemplateParmExpr(SubstNonTypeTemplateParmExpr *E) {
102     return Visit(E->getReplacement());
103   }
104 
105   // l-values.
106   void VisitDeclRefExpr(DeclRefExpr *DRE) { EmitAggLoadOfLValue(DRE); }
107   void VisitMemberExpr(MemberExpr *ME) { EmitAggLoadOfLValue(ME); }
108   void VisitUnaryDeref(UnaryOperator *E) { EmitAggLoadOfLValue(E); }
109   void VisitStringLiteral(StringLiteral *E) { EmitAggLoadOfLValue(E); }
110   void VisitCompoundLiteralExpr(CompoundLiteralExpr *E);
111   void VisitArraySubscriptExpr(ArraySubscriptExpr *E) {
112     EmitAggLoadOfLValue(E);
113   }
114   void VisitBlockDeclRefExpr(const BlockDeclRefExpr *E) {
115     EmitAggLoadOfLValue(E);
116   }
117   void VisitPredefinedExpr(const PredefinedExpr *E) {
118     EmitAggLoadOfLValue(E);
119   }
120 
121   // Operators.
122   void VisitCastExpr(CastExpr *E);
123   void VisitCallExpr(const CallExpr *E);
124   void VisitStmtExpr(const StmtExpr *E);
125   void VisitBinaryOperator(const BinaryOperator *BO);
126   void VisitPointerToDataMemberBinaryOperator(const BinaryOperator *BO);
127   void VisitBinAssign(const BinaryOperator *E);
128   void VisitBinComma(const BinaryOperator *E);
129 
130   void VisitObjCMessageExpr(ObjCMessageExpr *E);
131   void VisitObjCIvarRefExpr(ObjCIvarRefExpr *E) {
132     EmitAggLoadOfLValue(E);
133   }
134   void VisitObjCPropertyRefExpr(ObjCPropertyRefExpr *E);
135 
136   void VisitAbstractConditionalOperator(const AbstractConditionalOperator *CO);
137   void VisitChooseExpr(const ChooseExpr *CE);
138   void VisitInitListExpr(InitListExpr *E);
139   void VisitImplicitValueInitExpr(ImplicitValueInitExpr *E);
140   void VisitCXXDefaultArgExpr(CXXDefaultArgExpr *DAE) {
141     Visit(DAE->getExpr());
142   }
143   void VisitCXXBindTemporaryExpr(CXXBindTemporaryExpr *E);
144   void VisitCXXConstructExpr(const CXXConstructExpr *E);
145   void VisitExprWithCleanups(ExprWithCleanups *E);
146   void VisitCXXScalarValueInitExpr(CXXScalarValueInitExpr *E);
147   void VisitCXXTypeidExpr(CXXTypeidExpr *E) { EmitAggLoadOfLValue(E); }
148   void VisitMaterializeTemporaryExpr(MaterializeTemporaryExpr *E);
149   void VisitOpaqueValueExpr(OpaqueValueExpr *E);
150 
151   void VisitVAArgExpr(VAArgExpr *E);
152 
153   void EmitInitializationToLValue(Expr *E, LValue Address);
154   void EmitNullInitializationToLValue(LValue Address);
155   //  case Expr::ChooseExprClass:
156   void VisitCXXThrowExpr(const CXXThrowExpr *E) { CGF.EmitCXXThrowExpr(E); }
157 };
158 }  // end anonymous namespace.
159 
160 //===----------------------------------------------------------------------===//
161 //                                Utilities
162 //===----------------------------------------------------------------------===//
163 
164 /// EmitAggLoadOfLValue - Given an expression with aggregate type that
165 /// represents a value lvalue, this method emits the address of the lvalue,
166 /// then loads the result into DestPtr.
167 void AggExprEmitter::EmitAggLoadOfLValue(const Expr *E) {
168   LValue LV = CGF.EmitLValue(E);
169   EmitFinalDestCopy(E, LV);
170 }
171 
172 /// \brief True if the given aggregate type requires special GC API calls.
173 bool AggExprEmitter::TypeRequiresGCollection(QualType T) {
174   // Only record types have members that might require garbage collection.
175   const RecordType *RecordTy = T->getAs<RecordType>();
176   if (!RecordTy) return false;
177 
178   // Don't mess with non-trivial C++ types.
179   RecordDecl *Record = RecordTy->getDecl();
180   if (isa<CXXRecordDecl>(Record) &&
181       (!cast<CXXRecordDecl>(Record)->hasTrivialCopyConstructor() ||
182        !cast<CXXRecordDecl>(Record)->hasTrivialDestructor()))
183     return false;
184 
185   // Check whether the type has an object member.
186   return Record->hasObjectMember();
187 }
188 
189 /// \brief Perform the final move to DestPtr if for some reason
190 /// getReturnValueSlot() didn't use it directly.
191 ///
192 /// The idea is that you do something like this:
193 ///   RValue Result = EmitSomething(..., getReturnValueSlot());
194 ///   EmitMoveFromReturnSlot(E, Result);
195 ///
196 /// If nothing interferes, this will cause the result to be emitted
197 /// directly into the return value slot.  Otherwise, a final move
198 /// will be performed.
199 void AggExprEmitter::EmitMoveFromReturnSlot(const Expr *E, RValue Src) {
200   if (shouldUseDestForReturnSlot()) {
201     // Logically, Dest.getAddr() should equal Src.getAggregateAddr().
202     // The possibility of undef rvalues complicates that a lot,
203     // though, so we can't really assert.
204     return;
205   }
206 
207   // Otherwise, do a final copy,
208   assert(Dest.getAddr() != Src.getAggregateAddr());
209   EmitFinalDestCopy(E, Src, /*Ignore*/ true);
210 }
211 
212 /// EmitFinalDestCopy - Perform the final copy to DestPtr, if desired.
213 void AggExprEmitter::EmitFinalDestCopy(const Expr *E, RValue Src, bool Ignore) {
214   assert(Src.isAggregate() && "value must be aggregate value!");
215 
216   // If Dest is ignored, then we're evaluating an aggregate expression
217   // in a context (like an expression statement) that doesn't care
218   // about the result.  C says that an lvalue-to-rvalue conversion is
219   // performed in these cases; C++ says that it is not.  In either
220   // case, we don't actually need to do anything unless the value is
221   // volatile.
222   if (Dest.isIgnored()) {
223     if (!Src.isVolatileQualified() ||
224         CGF.CGM.getLangOptions().CPlusPlus ||
225         (IgnoreResult && Ignore))
226       return;
227 
228     // If the source is volatile, we must read from it; to do that, we need
229     // some place to put it.
230     Dest = CGF.CreateAggTemp(E->getType(), "agg.tmp");
231   }
232 
233   if (Dest.requiresGCollection()) {
234     CharUnits size = CGF.getContext().getTypeSizeInChars(E->getType());
235     llvm::Type *SizeTy = CGF.ConvertType(CGF.getContext().getSizeType());
236     llvm::Value *SizeVal = llvm::ConstantInt::get(SizeTy, size.getQuantity());
237     CGF.CGM.getObjCRuntime().EmitGCMemmoveCollectable(CGF,
238                                                       Dest.getAddr(),
239                                                       Src.getAggregateAddr(),
240                                                       SizeVal);
241     return;
242   }
243   // If the result of the assignment is used, copy the LHS there also.
244   // FIXME: Pass VolatileDest as well.  I think we also need to merge volatile
245   // from the source as well, as we can't eliminate it if either operand
246   // is volatile, unless copy has volatile for both source and destination..
247   CGF.EmitAggregateCopy(Dest.getAddr(), Src.getAggregateAddr(), E->getType(),
248                         Dest.isVolatile()|Src.isVolatileQualified());
249 }
250 
251 /// EmitFinalDestCopy - Perform the final copy to DestPtr, if desired.
252 void AggExprEmitter::EmitFinalDestCopy(const Expr *E, LValue Src, bool Ignore) {
253   assert(Src.isSimple() && "Can't have aggregate bitfield, vector, etc");
254 
255   EmitFinalDestCopy(E, RValue::getAggregate(Src.getAddress(),
256                                             Src.isVolatileQualified()),
257                     Ignore);
258 }
259 
260 //===----------------------------------------------------------------------===//
261 //                            Visitor Methods
262 //===----------------------------------------------------------------------===//
263 
264 void AggExprEmitter::VisitMaterializeTemporaryExpr(MaterializeTemporaryExpr *E){
265   Visit(E->GetTemporaryExpr());
266 }
267 
268 void AggExprEmitter::VisitOpaqueValueExpr(OpaqueValueExpr *e) {
269   EmitFinalDestCopy(e, CGF.getOpaqueLValueMapping(e));
270 }
271 
272 void
273 AggExprEmitter::VisitCompoundLiteralExpr(CompoundLiteralExpr *E) {
274   if (E->getType().isPODType(CGF.getContext())) {
275     // For a POD type, just emit a load of the lvalue + a copy, because our
276     // compound literal might alias the destination.
277     // FIXME: This is a band-aid; the real problem appears to be in our handling
278     // of assignments, where we store directly into the LHS without checking
279     // whether anything in the RHS aliases.
280     EmitAggLoadOfLValue(E);
281     return;
282   }
283 
284   AggValueSlot Slot = EnsureSlot(E->getType());
285   CGF.EmitAggExpr(E->getInitializer(), Slot);
286 }
287 
288 
289 void AggExprEmitter::VisitCastExpr(CastExpr *E) {
290   switch (E->getCastKind()) {
291   case CK_Dynamic: {
292     assert(isa<CXXDynamicCastExpr>(E) && "CK_Dynamic without a dynamic_cast?");
293     LValue LV = CGF.EmitCheckedLValue(E->getSubExpr());
294     // FIXME: Do we also need to handle property references here?
295     if (LV.isSimple())
296       CGF.EmitDynamicCast(LV.getAddress(), cast<CXXDynamicCastExpr>(E));
297     else
298       CGF.CGM.ErrorUnsupported(E, "non-simple lvalue dynamic_cast");
299 
300     if (!Dest.isIgnored())
301       CGF.CGM.ErrorUnsupported(E, "lvalue dynamic_cast with a destination");
302     break;
303   }
304 
305   case CK_ToUnion: {
306     if (Dest.isIgnored()) break;
307 
308     // GCC union extension
309     QualType Ty = E->getSubExpr()->getType();
310     QualType PtrTy = CGF.getContext().getPointerType(Ty);
311     llvm::Value *CastPtr = Builder.CreateBitCast(Dest.getAddr(),
312                                                  CGF.ConvertType(PtrTy));
313     EmitInitializationToLValue(E->getSubExpr(),
314                                CGF.MakeAddrLValue(CastPtr, Ty));
315     break;
316   }
317 
318   case CK_DerivedToBase:
319   case CK_BaseToDerived:
320   case CK_UncheckedDerivedToBase: {
321     assert(0 && "cannot perform hierarchy conversion in EmitAggExpr: "
322                 "should have been unpacked before we got here");
323     break;
324   }
325 
326   case CK_GetObjCProperty: {
327     LValue LV = CGF.EmitLValue(E->getSubExpr());
328     assert(LV.isPropertyRef());
329     RValue RV = CGF.EmitLoadOfPropertyRefLValue(LV, getReturnValueSlot());
330     EmitMoveFromReturnSlot(E, RV);
331     break;
332   }
333 
334   case CK_LValueToRValue: // hope for downstream optimization
335   case CK_NoOp:
336   case CK_UserDefinedConversion:
337   case CK_ConstructorConversion:
338     assert(CGF.getContext().hasSameUnqualifiedType(E->getSubExpr()->getType(),
339                                                    E->getType()) &&
340            "Implicit cast types must be compatible");
341     Visit(E->getSubExpr());
342     break;
343 
344   case CK_LValueBitCast:
345     llvm_unreachable("should not be emitting lvalue bitcast as rvalue");
346     break;
347 
348   case CK_Dependent:
349   case CK_BitCast:
350   case CK_ArrayToPointerDecay:
351   case CK_FunctionToPointerDecay:
352   case CK_NullToPointer:
353   case CK_NullToMemberPointer:
354   case CK_BaseToDerivedMemberPointer:
355   case CK_DerivedToBaseMemberPointer:
356   case CK_MemberPointerToBoolean:
357   case CK_IntegralToPointer:
358   case CK_PointerToIntegral:
359   case CK_PointerToBoolean:
360   case CK_ToVoid:
361   case CK_VectorSplat:
362   case CK_IntegralCast:
363   case CK_IntegralToBoolean:
364   case CK_IntegralToFloating:
365   case CK_FloatingToIntegral:
366   case CK_FloatingToBoolean:
367   case CK_FloatingCast:
368   case CK_CPointerToObjCPointerCast:
369   case CK_BlockPointerToObjCPointerCast:
370   case CK_AnyPointerToBlockPointerCast:
371   case CK_ObjCObjectLValueCast:
372   case CK_FloatingRealToComplex:
373   case CK_FloatingComplexToReal:
374   case CK_FloatingComplexToBoolean:
375   case CK_FloatingComplexCast:
376   case CK_FloatingComplexToIntegralComplex:
377   case CK_IntegralRealToComplex:
378   case CK_IntegralComplexToReal:
379   case CK_IntegralComplexToBoolean:
380   case CK_IntegralComplexCast:
381   case CK_IntegralComplexToFloatingComplex:
382   case CK_ObjCProduceObject:
383   case CK_ObjCConsumeObject:
384   case CK_ObjCReclaimReturnedObject:
385     llvm_unreachable("cast kind invalid for aggregate types");
386   }
387 }
388 
389 void AggExprEmitter::VisitCallExpr(const CallExpr *E) {
390   if (E->getCallReturnType()->isReferenceType()) {
391     EmitAggLoadOfLValue(E);
392     return;
393   }
394 
395   RValue RV = CGF.EmitCallExpr(E, getReturnValueSlot());
396   EmitMoveFromReturnSlot(E, RV);
397 }
398 
399 void AggExprEmitter::VisitObjCMessageExpr(ObjCMessageExpr *E) {
400   RValue RV = CGF.EmitObjCMessageExpr(E, getReturnValueSlot());
401   EmitMoveFromReturnSlot(E, RV);
402 }
403 
404 void AggExprEmitter::VisitObjCPropertyRefExpr(ObjCPropertyRefExpr *E) {
405   llvm_unreachable("direct property access not surrounded by "
406                    "lvalue-to-rvalue cast");
407 }
408 
409 void AggExprEmitter::VisitBinComma(const BinaryOperator *E) {
410   CGF.EmitIgnoredExpr(E->getLHS());
411   Visit(E->getRHS());
412 }
413 
414 void AggExprEmitter::VisitStmtExpr(const StmtExpr *E) {
415   CodeGenFunction::StmtExprEvaluation eval(CGF);
416   CGF.EmitCompoundStmt(*E->getSubStmt(), true, Dest);
417 }
418 
419 void AggExprEmitter::VisitBinaryOperator(const BinaryOperator *E) {
420   if (E->getOpcode() == BO_PtrMemD || E->getOpcode() == BO_PtrMemI)
421     VisitPointerToDataMemberBinaryOperator(E);
422   else
423     CGF.ErrorUnsupported(E, "aggregate binary expression");
424 }
425 
426 void AggExprEmitter::VisitPointerToDataMemberBinaryOperator(
427                                                     const BinaryOperator *E) {
428   LValue LV = CGF.EmitPointerToDataMemberBinaryExpr(E);
429   EmitFinalDestCopy(E, LV);
430 }
431 
432 void AggExprEmitter::VisitBinAssign(const BinaryOperator *E) {
433   // For an assignment to work, the value on the right has
434   // to be compatible with the value on the left.
435   assert(CGF.getContext().hasSameUnqualifiedType(E->getLHS()->getType(),
436                                                  E->getRHS()->getType())
437          && "Invalid assignment");
438 
439   if (const DeclRefExpr *DRE = dyn_cast<DeclRefExpr>(E->getLHS()))
440     if (const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl()))
441       if (VD->hasAttr<BlocksAttr>() &&
442           E->getRHS()->HasSideEffects(CGF.getContext())) {
443         // When __block variable on LHS, the RHS must be evaluated first
444         // as it may change the 'forwarding' field via call to Block_copy.
445         LValue RHS = CGF.EmitLValue(E->getRHS());
446         LValue LHS = CGF.EmitLValue(E->getLHS());
447         Dest = AggValueSlot::forLValue(LHS, AggValueSlot::IsDestructed,
448                                        needsGC(E->getLHS()->getType()),
449                                        AggValueSlot::IsAliased);
450         EmitFinalDestCopy(E, RHS, true);
451         return;
452       }
453 
454   LValue LHS = CGF.EmitLValue(E->getLHS());
455 
456   // We have to special case property setters, otherwise we must have
457   // a simple lvalue (no aggregates inside vectors, bitfields).
458   if (LHS.isPropertyRef()) {
459     const ObjCPropertyRefExpr *RE = LHS.getPropertyRefExpr();
460     QualType ArgType = RE->getSetterArgType();
461     RValue Src;
462     if (ArgType->isReferenceType())
463       Src = CGF.EmitReferenceBindingToExpr(E->getRHS(), 0);
464     else {
465       AggValueSlot Slot = EnsureSlot(E->getRHS()->getType());
466       CGF.EmitAggExpr(E->getRHS(), Slot);
467       Src = Slot.asRValue();
468     }
469     CGF.EmitStoreThroughPropertyRefLValue(Src, LHS);
470   } else {
471     // Codegen the RHS so that it stores directly into the LHS.
472     AggValueSlot LHSSlot =
473       AggValueSlot::forLValue(LHS, AggValueSlot::IsDestructed,
474                               needsGC(E->getLHS()->getType()),
475                               AggValueSlot::IsAliased);
476     CGF.EmitAggExpr(E->getRHS(), LHSSlot, false);
477     EmitFinalDestCopy(E, LHS, true);
478   }
479 }
480 
481 void AggExprEmitter::
482 VisitAbstractConditionalOperator(const AbstractConditionalOperator *E) {
483   llvm::BasicBlock *LHSBlock = CGF.createBasicBlock("cond.true");
484   llvm::BasicBlock *RHSBlock = CGF.createBasicBlock("cond.false");
485   llvm::BasicBlock *ContBlock = CGF.createBasicBlock("cond.end");
486 
487   // Bind the common expression if necessary.
488   CodeGenFunction::OpaqueValueMapping binding(CGF, E);
489 
490   CodeGenFunction::ConditionalEvaluation eval(CGF);
491   CGF.EmitBranchOnBoolExpr(E->getCond(), LHSBlock, RHSBlock);
492 
493   // Save whether the destination's lifetime is externally managed.
494   bool isExternallyDestructed = Dest.isExternallyDestructed();
495 
496   eval.begin(CGF);
497   CGF.EmitBlock(LHSBlock);
498   Visit(E->getTrueExpr());
499   eval.end(CGF);
500 
501   assert(CGF.HaveInsertPoint() && "expression evaluation ended with no IP!");
502   CGF.Builder.CreateBr(ContBlock);
503 
504   // If the result of an agg expression is unused, then the emission
505   // of the LHS might need to create a destination slot.  That's fine
506   // with us, and we can safely emit the RHS into the same slot, but
507   // we shouldn't claim that it's already being destructed.
508   Dest.setExternallyDestructed(isExternallyDestructed);
509 
510   eval.begin(CGF);
511   CGF.EmitBlock(RHSBlock);
512   Visit(E->getFalseExpr());
513   eval.end(CGF);
514 
515   CGF.EmitBlock(ContBlock);
516 }
517 
518 void AggExprEmitter::VisitChooseExpr(const ChooseExpr *CE) {
519   Visit(CE->getChosenSubExpr(CGF.getContext()));
520 }
521 
522 void AggExprEmitter::VisitVAArgExpr(VAArgExpr *VE) {
523   llvm::Value *ArgValue = CGF.EmitVAListRef(VE->getSubExpr());
524   llvm::Value *ArgPtr = CGF.EmitVAArg(ArgValue, VE->getType());
525 
526   if (!ArgPtr) {
527     CGF.ErrorUnsupported(VE, "aggregate va_arg expression");
528     return;
529   }
530 
531   EmitFinalDestCopy(VE, CGF.MakeAddrLValue(ArgPtr, VE->getType()));
532 }
533 
534 void AggExprEmitter::VisitCXXBindTemporaryExpr(CXXBindTemporaryExpr *E) {
535   // Ensure that we have a slot, but if we already do, remember
536   // whether it was externally destructed.
537   bool wasExternallyDestructed = Dest.isExternallyDestructed();
538   Dest = EnsureSlot(E->getType());
539 
540   // We're going to push a destructor if there isn't already one.
541   Dest.setExternallyDestructed();
542 
543   Visit(E->getSubExpr());
544 
545   // Push that destructor we promised.
546   if (!wasExternallyDestructed)
547     CGF.EmitCXXTemporary(E->getTemporary(), Dest.getAddr());
548 }
549 
550 void
551 AggExprEmitter::VisitCXXConstructExpr(const CXXConstructExpr *E) {
552   AggValueSlot Slot = EnsureSlot(E->getType());
553   CGF.EmitCXXConstructExpr(E, Slot);
554 }
555 
556 void AggExprEmitter::VisitExprWithCleanups(ExprWithCleanups *E) {
557   CGF.EmitExprWithCleanups(E, Dest);
558 }
559 
560 void AggExprEmitter::VisitCXXScalarValueInitExpr(CXXScalarValueInitExpr *E) {
561   QualType T = E->getType();
562   AggValueSlot Slot = EnsureSlot(T);
563   EmitNullInitializationToLValue(CGF.MakeAddrLValue(Slot.getAddr(), T));
564 }
565 
566 void AggExprEmitter::VisitImplicitValueInitExpr(ImplicitValueInitExpr *E) {
567   QualType T = E->getType();
568   AggValueSlot Slot = EnsureSlot(T);
569   EmitNullInitializationToLValue(CGF.MakeAddrLValue(Slot.getAddr(), T));
570 }
571 
572 /// isSimpleZero - If emitting this value will obviously just cause a store of
573 /// zero to memory, return true.  This can return false if uncertain, so it just
574 /// handles simple cases.
575 static bool isSimpleZero(const Expr *E, CodeGenFunction &CGF) {
576   E = E->IgnoreParens();
577 
578   // 0
579   if (const IntegerLiteral *IL = dyn_cast<IntegerLiteral>(E))
580     return IL->getValue() == 0;
581   // +0.0
582   if (const FloatingLiteral *FL = dyn_cast<FloatingLiteral>(E))
583     return FL->getValue().isPosZero();
584   // int()
585   if ((isa<ImplicitValueInitExpr>(E) || isa<CXXScalarValueInitExpr>(E)) &&
586       CGF.getTypes().isZeroInitializable(E->getType()))
587     return true;
588   // (int*)0 - Null pointer expressions.
589   if (const CastExpr *ICE = dyn_cast<CastExpr>(E))
590     return ICE->getCastKind() == CK_NullToPointer;
591   // '\0'
592   if (const CharacterLiteral *CL = dyn_cast<CharacterLiteral>(E))
593     return CL->getValue() == 0;
594 
595   // Otherwise, hard case: conservatively return false.
596   return false;
597 }
598 
599 
600 void
601 AggExprEmitter::EmitInitializationToLValue(Expr* E, LValue LV) {
602   QualType type = LV.getType();
603   // FIXME: Ignore result?
604   // FIXME: Are initializers affected by volatile?
605   if (Dest.isZeroed() && isSimpleZero(E, CGF)) {
606     // Storing "i32 0" to a zero'd memory location is a noop.
607   } else if (isa<ImplicitValueInitExpr>(E)) {
608     EmitNullInitializationToLValue(LV);
609   } else if (type->isReferenceType()) {
610     RValue RV = CGF.EmitReferenceBindingToExpr(E, /*InitializedDecl=*/0);
611     CGF.EmitStoreThroughLValue(RV, LV);
612   } else if (type->isAnyComplexType()) {
613     CGF.EmitComplexExprIntoAddr(E, LV.getAddress(), false);
614   } else if (CGF.hasAggregateLLVMType(type)) {
615     CGF.EmitAggExpr(E, AggValueSlot::forLValue(LV,
616                                                AggValueSlot::IsDestructed,
617                                       AggValueSlot::DoesNotNeedGCBarriers,
618                                                AggValueSlot::IsNotAliased,
619                                                Dest.isZeroed()));
620   } else if (LV.isSimple()) {
621     CGF.EmitScalarInit(E, /*D=*/0, LV, /*Captured=*/false);
622   } else {
623     CGF.EmitStoreThroughLValue(RValue::get(CGF.EmitScalarExpr(E)), LV);
624   }
625 }
626 
627 void AggExprEmitter::EmitNullInitializationToLValue(LValue lv) {
628   QualType type = lv.getType();
629 
630   // If the destination slot is already zeroed out before the aggregate is
631   // copied into it, we don't have to emit any zeros here.
632   if (Dest.isZeroed() && CGF.getTypes().isZeroInitializable(type))
633     return;
634 
635   if (!CGF.hasAggregateLLVMType(type)) {
636     // For non-aggregates, we can store zero
637     llvm::Value *null = llvm::Constant::getNullValue(CGF.ConvertType(type));
638     CGF.EmitStoreThroughLValue(RValue::get(null), lv);
639   } else {
640     // There's a potential optimization opportunity in combining
641     // memsets; that would be easy for arrays, but relatively
642     // difficult for structures with the current code.
643     CGF.EmitNullInitialization(lv.getAddress(), lv.getType());
644   }
645 }
646 
647 void AggExprEmitter::VisitInitListExpr(InitListExpr *E) {
648 #if 0
649   // FIXME: Assess perf here?  Figure out what cases are worth optimizing here
650   // (Length of globals? Chunks of zeroed-out space?).
651   //
652   // If we can, prefer a copy from a global; this is a lot less code for long
653   // globals, and it's easier for the current optimizers to analyze.
654   if (llvm::Constant* C = CGF.CGM.EmitConstantExpr(E, E->getType(), &CGF)) {
655     llvm::GlobalVariable* GV =
656     new llvm::GlobalVariable(CGF.CGM.getModule(), C->getType(), true,
657                              llvm::GlobalValue::InternalLinkage, C, "");
658     EmitFinalDestCopy(E, CGF.MakeAddrLValue(GV, E->getType()));
659     return;
660   }
661 #endif
662   if (E->hadArrayRangeDesignator())
663     CGF.ErrorUnsupported(E, "GNU array range designator extension");
664 
665   llvm::Value *DestPtr = Dest.getAddr();
666 
667   // Handle initialization of an array.
668   if (E->getType()->isArrayType()) {
669     llvm::PointerType *APType =
670       cast<llvm::PointerType>(DestPtr->getType());
671     llvm::ArrayType *AType =
672       cast<llvm::ArrayType>(APType->getElementType());
673 
674     uint64_t NumInitElements = E->getNumInits();
675 
676     if (E->getNumInits() > 0) {
677       QualType T1 = E->getType();
678       QualType T2 = E->getInit(0)->getType();
679       if (CGF.getContext().hasSameUnqualifiedType(T1, T2)) {
680         EmitAggLoadOfLValue(E->getInit(0));
681         return;
682       }
683     }
684 
685     uint64_t NumArrayElements = AType->getNumElements();
686     assert(NumInitElements <= NumArrayElements);
687 
688     QualType elementType = E->getType().getCanonicalType();
689     elementType = CGF.getContext().getQualifiedType(
690                     cast<ArrayType>(elementType)->getElementType(),
691                     elementType.getQualifiers() + Dest.getQualifiers());
692 
693     // DestPtr is an array*.  Construct an elementType* by drilling
694     // down a level.
695     llvm::Value *zero = llvm::ConstantInt::get(CGF.SizeTy, 0);
696     llvm::Value *indices[] = { zero, zero };
697     llvm::Value *begin =
698       Builder.CreateInBoundsGEP(DestPtr, indices, "arrayinit.begin");
699 
700     // Exception safety requires us to destroy all the
701     // already-constructed members if an initializer throws.
702     // For that, we'll need an EH cleanup.
703     QualType::DestructionKind dtorKind = elementType.isDestructedType();
704     llvm::AllocaInst *endOfInit = 0;
705     EHScopeStack::stable_iterator cleanup;
706     if (CGF.needsEHCleanup(dtorKind)) {
707       // In principle we could tell the cleanup where we are more
708       // directly, but the control flow can get so varied here that it
709       // would actually be quite complex.  Therefore we go through an
710       // alloca.
711       endOfInit = CGF.CreateTempAlloca(begin->getType(),
712                                        "arrayinit.endOfInit");
713       Builder.CreateStore(begin, endOfInit);
714       CGF.pushIrregularPartialArrayCleanup(begin, endOfInit, elementType,
715                                            CGF.getDestroyer(dtorKind));
716       cleanup = CGF.EHStack.stable_begin();
717 
718     // Otherwise, remember that we didn't need a cleanup.
719     } else {
720       dtorKind = QualType::DK_none;
721     }
722 
723     llvm::Value *one = llvm::ConstantInt::get(CGF.SizeTy, 1);
724 
725     // The 'current element to initialize'.  The invariants on this
726     // variable are complicated.  Essentially, after each iteration of
727     // the loop, it points to the last initialized element, except
728     // that it points to the beginning of the array before any
729     // elements have been initialized.
730     llvm::Value *element = begin;
731 
732     // Emit the explicit initializers.
733     for (uint64_t i = 0; i != NumInitElements; ++i) {
734       // Advance to the next element.
735       if (i > 0) {
736         element = Builder.CreateInBoundsGEP(element, one, "arrayinit.element");
737 
738         // Tell the cleanup that it needs to destroy up to this
739         // element.  TODO: some of these stores can be trivially
740         // observed to be unnecessary.
741         if (endOfInit) Builder.CreateStore(element, endOfInit);
742       }
743 
744       LValue elementLV = CGF.MakeAddrLValue(element, elementType);
745       EmitInitializationToLValue(E->getInit(i), elementLV);
746     }
747 
748     // Check whether there's a non-trivial array-fill expression.
749     // Note that this will be a CXXConstructExpr even if the element
750     // type is an array (or array of array, etc.) of class type.
751     Expr *filler = E->getArrayFiller();
752     bool hasTrivialFiller = true;
753     if (CXXConstructExpr *cons = dyn_cast_or_null<CXXConstructExpr>(filler)) {
754       assert(cons->getConstructor()->isDefaultConstructor());
755       hasTrivialFiller = cons->getConstructor()->isTrivial();
756     }
757 
758     // Any remaining elements need to be zero-initialized, possibly
759     // using the filler expression.  We can skip this if the we're
760     // emitting to zeroed memory.
761     if (NumInitElements != NumArrayElements &&
762         !(Dest.isZeroed() && hasTrivialFiller &&
763           CGF.getTypes().isZeroInitializable(elementType))) {
764 
765       // Use an actual loop.  This is basically
766       //   do { *array++ = filler; } while (array != end);
767 
768       // Advance to the start of the rest of the array.
769       if (NumInitElements) {
770         element = Builder.CreateInBoundsGEP(element, one, "arrayinit.start");
771         if (endOfInit) Builder.CreateStore(element, endOfInit);
772       }
773 
774       // Compute the end of the array.
775       llvm::Value *end = Builder.CreateInBoundsGEP(begin,
776                         llvm::ConstantInt::get(CGF.SizeTy, NumArrayElements),
777                                                    "arrayinit.end");
778 
779       llvm::BasicBlock *entryBB = Builder.GetInsertBlock();
780       llvm::BasicBlock *bodyBB = CGF.createBasicBlock("arrayinit.body");
781 
782       // Jump into the body.
783       CGF.EmitBlock(bodyBB);
784       llvm::PHINode *currentElement =
785         Builder.CreatePHI(element->getType(), 2, "arrayinit.cur");
786       currentElement->addIncoming(element, entryBB);
787 
788       // Emit the actual filler expression.
789       LValue elementLV = CGF.MakeAddrLValue(currentElement, elementType);
790       if (filler)
791         EmitInitializationToLValue(filler, elementLV);
792       else
793         EmitNullInitializationToLValue(elementLV);
794 
795       // Move on to the next element.
796       llvm::Value *nextElement =
797         Builder.CreateInBoundsGEP(currentElement, one, "arrayinit.next");
798 
799       // Tell the EH cleanup that we finished with the last element.
800       if (endOfInit) Builder.CreateStore(nextElement, endOfInit);
801 
802       // Leave the loop if we're done.
803       llvm::Value *done = Builder.CreateICmpEQ(nextElement, end,
804                                                "arrayinit.done");
805       llvm::BasicBlock *endBB = CGF.createBasicBlock("arrayinit.end");
806       Builder.CreateCondBr(done, endBB, bodyBB);
807       currentElement->addIncoming(nextElement, Builder.GetInsertBlock());
808 
809       CGF.EmitBlock(endBB);
810     }
811 
812     // Leave the partial-array cleanup if we entered one.
813     if (dtorKind) CGF.DeactivateCleanupBlock(cleanup);
814 
815     return;
816   }
817 
818   assert(E->getType()->isRecordType() && "Only support structs/unions here!");
819 
  // Do struct initialization; this code just sets each individual member
  // to the appropriate value.  This makes bitfield support automatic;
  // the disadvantage is that the generated code is more difficult for
  // the optimizer, especially with bitfields.
824   unsigned NumInitElements = E->getNumInits();
825   RecordDecl *record = E->getType()->castAs<RecordType>()->getDecl();
826 
827   if (record->isUnion()) {
828     // Only initialize one field of a union. The field itself is
829     // specified by the initializer list.
830     if (!E->getInitializedFieldInUnion()) {
831       // Empty union; we have nothing to do.
832 
833 #ifndef NDEBUG
834       // Make sure that it's really an empty and not a failure of
835       // semantic analysis.
836       for (RecordDecl::field_iterator Field = record->field_begin(),
837                                    FieldEnd = record->field_end();
838            Field != FieldEnd; ++Field)
839         assert(Field->isUnnamedBitfield() && "Only unnamed bitfields allowed");
840 #endif
841       return;
842     }
843 
844     // FIXME: volatility
845     FieldDecl *Field = E->getInitializedFieldInUnion();
846 
847     LValue FieldLoc = CGF.EmitLValueForFieldInitialization(DestPtr, Field, 0);
848     if (NumInitElements) {
849       // Store the initializer into the field
850       EmitInitializationToLValue(E->getInit(0), FieldLoc);
851     } else {
852       // Default-initialize to null.
853       EmitNullInitializationToLValue(FieldLoc);
854     }
855 
856     return;
857   }
858 
859   // We'll need to enter cleanup scopes in case any of the member
860   // initializers throw an exception.
861   SmallVector<EHScopeStack::stable_iterator, 16> cleanups;
862 
863   // Here we iterate over the fields; this makes it simpler to both
864   // default-initialize fields and skip over unnamed fields.
865   unsigned curInitIndex = 0;
866   for (RecordDecl::field_iterator field = record->field_begin(),
867                                fieldEnd = record->field_end();
868        field != fieldEnd; ++field) {
869     // We're done once we hit the flexible array member.
870     if (field->getType()->isIncompleteArrayType())
871       break;
872 
873     // Always skip anonymous bitfields.
874     if (field->isUnnamedBitfield())
875       continue;
876 
877     // We're done if we reach the end of the explicit initializers, we
878     // have a zeroed object, and the rest of the fields are
879     // zero-initializable.
880     if (curInitIndex == NumInitElements && Dest.isZeroed() &&
881         CGF.getTypes().isZeroInitializable(E->getType()))
882       break;
883 
884     // FIXME: volatility
885     LValue LV = CGF.EmitLValueForFieldInitialization(DestPtr, *field, 0);
    // We never generate write-barriers for initialized fields.
887     LV.setNonGC(true);
888 
889     if (curInitIndex < NumInitElements) {
890       // Store the initializer into the field.
891       EmitInitializationToLValue(E->getInit(curInitIndex++), LV);
892     } else {
      // We're out of initializers; default-initialize to null
894       EmitNullInitializationToLValue(LV);
895     }
896 
897     // Push a destructor if necessary.
898     // FIXME: if we have an array of structures, all explicitly
899     // initialized, we can end up pushing a linear number of cleanups.
900     bool pushedCleanup = false;
901     if (QualType::DestructionKind dtorKind
902           = field->getType().isDestructedType()) {
903       assert(LV.isSimple());
904       if (CGF.needsEHCleanup(dtorKind)) {
905         CGF.pushDestroy(EHCleanup, LV.getAddress(), field->getType(),
906                         CGF.getDestroyer(dtorKind), false);
907         cleanups.push_back(CGF.EHStack.stable_begin());
908         pushedCleanup = true;
909       }
910     }
911 
912     // If the GEP didn't get used because of a dead zero init or something
913     // else, clean it up for -O0 builds and general tidiness.
914     if (!pushedCleanup && LV.isSimple())
915       if (llvm::GetElementPtrInst *GEP =
916             dyn_cast<llvm::GetElementPtrInst>(LV.getAddress()))
917         if (GEP->use_empty())
918           GEP->eraseFromParent();
919   }
920 
921   // Deactivate all the partial cleanups in reverse order, which
922   // generally means popping them.
923   for (unsigned i = cleanups.size(); i != 0; --i)
924     CGF.DeactivateCleanupBlock(cleanups[i-1]);
925 }
926 
927 //===----------------------------------------------------------------------===//
928 //                        Entry Points into this File
929 //===----------------------------------------------------------------------===//
930 
931 /// GetNumNonZeroBytesInInit - Get an approximate count of the number of
932 /// non-zero bytes that will be stored when outputting the initializer for the
933 /// specified initializer expression.
934 static CharUnits GetNumNonZeroBytesInInit(const Expr *E, CodeGenFunction &CGF) {
935   E = E->IgnoreParens();
936 
937   // 0 and 0.0 won't require any non-zero stores!
938   if (isSimpleZero(E, CGF)) return CharUnits::Zero();
939 
940   // If this is an initlist expr, sum up the size of sizes of the (present)
941   // elements.  If this is something weird, assume the whole thing is non-zero.
942   const InitListExpr *ILE = dyn_cast<InitListExpr>(E);
943   if (ILE == 0 || !CGF.getTypes().isZeroInitializable(ILE->getType()))
944     return CGF.getContext().getTypeSizeInChars(E->getType());
945 
946   // InitListExprs for structs have to be handled carefully.  If there are
947   // reference members, we need to consider the size of the reference, not the
948   // referencee.  InitListExprs for unions and arrays can't have references.
949   if (const RecordType *RT = E->getType()->getAs<RecordType>()) {
950     if (!RT->isUnionType()) {
951       RecordDecl *SD = E->getType()->getAs<RecordType>()->getDecl();
952       CharUnits NumNonZeroBytes = CharUnits::Zero();
953 
954       unsigned ILEElement = 0;
955       for (RecordDecl::field_iterator Field = SD->field_begin(),
956            FieldEnd = SD->field_end(); Field != FieldEnd; ++Field) {
957         // We're done once we hit the flexible array member or run out of
958         // InitListExpr elements.
959         if (Field->getType()->isIncompleteArrayType() ||
960             ILEElement == ILE->getNumInits())
961           break;
962         if (Field->isUnnamedBitfield())
963           continue;
964 
965         const Expr *E = ILE->getInit(ILEElement++);
966 
967         // Reference values are always non-null and have the width of a pointer.
968         if (Field->getType()->isReferenceType())
969           NumNonZeroBytes += CGF.getContext().toCharUnitsFromBits(
970               CGF.getContext().getTargetInfo().getPointerWidth(0));
971         else
972           NumNonZeroBytes += GetNumNonZeroBytesInInit(E, CGF);
973       }
974 
975       return NumNonZeroBytes;
976     }
977   }
978 
979 
980   CharUnits NumNonZeroBytes = CharUnits::Zero();
981   for (unsigned i = 0, e = ILE->getNumInits(); i != e; ++i)
982     NumNonZeroBytes += GetNumNonZeroBytesInInit(ILE->getInit(i), CGF);
983   return NumNonZeroBytes;
984 }
985 
986 /// CheckAggExprForMemSetUse - If the initializer is large and has a lot of
987 /// zeros in it, emit a memset and avoid storing the individual zeros.
988 ///
989 static void CheckAggExprForMemSetUse(AggValueSlot &Slot, const Expr *E,
990                                      CodeGenFunction &CGF) {
991   // If the slot is already known to be zeroed, nothing to do.  Don't mess with
992   // volatile stores.
993   if (Slot.isZeroed() || Slot.isVolatile() || Slot.getAddr() == 0) return;
994 
995   // C++ objects with a user-declared constructor don't need zero'ing.
996   if (CGF.getContext().getLangOptions().CPlusPlus)
997     if (const RecordType *RT = CGF.getContext()
998                        .getBaseElementType(E->getType())->getAs<RecordType>()) {
999       const CXXRecordDecl *RD = cast<CXXRecordDecl>(RT->getDecl());
1000       if (RD->hasUserDeclaredConstructor())
1001         return;
1002     }
1003 
1004   // If the type is 16-bytes or smaller, prefer individual stores over memset.
1005   std::pair<CharUnits, CharUnits> TypeInfo =
1006     CGF.getContext().getTypeInfoInChars(E->getType());
1007   if (TypeInfo.first <= CharUnits::fromQuantity(16))
1008     return;
1009 
1010   // Check to see if over 3/4 of the initializer are known to be zero.  If so,
1011   // we prefer to emit memset + individual stores for the rest.
1012   CharUnits NumNonZeroBytes = GetNumNonZeroBytesInInit(E, CGF);
1013   if (NumNonZeroBytes*4 > TypeInfo.first)
1014     return;
1015 
1016   // Okay, it seems like a good idea to use an initial memset, emit the call.
1017   llvm::Constant *SizeVal = CGF.Builder.getInt64(TypeInfo.first.getQuantity());
1018   CharUnits Align = TypeInfo.second;
1019 
1020   llvm::Value *Loc = Slot.getAddr();
1021   llvm::Type *BP = llvm::Type::getInt8PtrTy(CGF.getLLVMContext());
1022 
1023   Loc = CGF.Builder.CreateBitCast(Loc, BP);
1024   CGF.Builder.CreateMemSet(Loc, CGF.Builder.getInt8(0), SizeVal,
1025                            Align.getQuantity(), false);
1026 
1027   // Tell the AggExprEmitter that the slot is known zero.
1028   Slot.setZeroed();
1029 }
1030 
1031 
1032 
1033 
1034 /// EmitAggExpr - Emit the computation of the specified expression of aggregate
1035 /// type.  The result is computed into DestPtr.  Note that if DestPtr is null,
1036 /// the value of the aggregate expression is not needed.  If VolatileDest is
1037 /// true, DestPtr cannot be 0.
1038 ///
1039 /// \param IsInitializer - true if this evaluation is initializing an
1040 /// object whose lifetime is already being managed.
1041 void CodeGenFunction::EmitAggExpr(const Expr *E, AggValueSlot Slot,
1042                                   bool IgnoreResult) {
1043   assert(E && hasAggregateLLVMType(E->getType()) &&
1044          "Invalid aggregate expression to emit");
1045   assert((Slot.getAddr() != 0 || Slot.isIgnored()) &&
1046          "slot has bits but no address");
1047 
1048   // Optimize the slot if possible.
1049   CheckAggExprForMemSetUse(Slot, E, *this);
1050 
1051   AggExprEmitter(*this, Slot, IgnoreResult).Visit(const_cast<Expr*>(E));
1052 }
1053 
1054 LValue CodeGenFunction::EmitAggExprToLValue(const Expr *E) {
1055   assert(hasAggregateLLVMType(E->getType()) && "Invalid argument!");
1056   llvm::Value *Temp = CreateMemTemp(E->getType());
1057   LValue LV = MakeAddrLValue(Temp, E->getType());
1058   EmitAggExpr(E, AggValueSlot::forLValue(LV, AggValueSlot::IsNotDestructed,
1059                                          AggValueSlot::DoesNotNeedGCBarriers,
1060                                          AggValueSlot::IsNotAliased));
1061   return LV;
1062 }
1063 
1064 void CodeGenFunction::EmitAggregateCopy(llvm::Value *DestPtr,
1065                                         llvm::Value *SrcPtr, QualType Ty,
1066                                         bool isVolatile) {
1067   assert(!Ty->isAnyComplexType() && "Shouldn't happen for complex");
1068 
1069   if (getContext().getLangOptions().CPlusPlus) {
1070     if (const RecordType *RT = Ty->getAs<RecordType>()) {
1071       CXXRecordDecl *Record = cast<CXXRecordDecl>(RT->getDecl());
1072       assert((Record->hasTrivialCopyConstructor() ||
1073               Record->hasTrivialCopyAssignment() ||
1074               Record->hasTrivialMoveConstructor() ||
1075               Record->hasTrivialMoveAssignment()) &&
1076              "Trying to aggregate-copy a type without a trivial copy "
1077              "constructor or assignment operator");
1078       // Ignore empty classes in C++.
1079       if (Record->isEmpty())
1080         return;
1081     }
1082   }
1083 
1084   // Aggregate assignment turns into llvm.memcpy.  This is almost valid per
1085   // C99 6.5.16.1p3, which states "If the value being stored in an object is
1086   // read from another object that overlaps in anyway the storage of the first
1087   // object, then the overlap shall be exact and the two objects shall have
1088   // qualified or unqualified versions of a compatible type."
1089   //
1090   // memcpy is not defined if the source and destination pointers are exactly
1091   // equal, but other compilers do this optimization, and almost every memcpy
1092   // implementation handles this case safely.  If there is a libc that does not
1093   // safely handle this, we can add a target hook.
1094 
1095   // Get size and alignment info for this aggregate.
1096   std::pair<CharUnits, CharUnits> TypeInfo =
1097     getContext().getTypeInfoInChars(Ty);
1098 
1099   // FIXME: Handle variable sized types.
1100 
1101   // FIXME: If we have a volatile struct, the optimizer can remove what might
1102   // appear to be `extra' memory ops:
1103   //
1104   // volatile struct { int i; } a, b;
1105   //
1106   // int main() {
1107   //   a = b;
1108   //   a = b;
1109   // }
1110   //
1111   // we need to use a different call here.  We use isVolatile to indicate when
1112   // either the source or the destination is volatile.
1113 
1114   llvm::PointerType *DPT = cast<llvm::PointerType>(DestPtr->getType());
1115   llvm::Type *DBP =
1116     llvm::Type::getInt8PtrTy(getLLVMContext(), DPT->getAddressSpace());
1117   DestPtr = Builder.CreateBitCast(DestPtr, DBP, "tmp");
1118 
1119   llvm::PointerType *SPT = cast<llvm::PointerType>(SrcPtr->getType());
1120   llvm::Type *SBP =
1121     llvm::Type::getInt8PtrTy(getLLVMContext(), SPT->getAddressSpace());
1122   SrcPtr = Builder.CreateBitCast(SrcPtr, SBP, "tmp");
1123 
1124   // Don't do any of the memmove_collectable tests if GC isn't set.
1125   if (CGM.getLangOptions().getGCMode() == LangOptions::NonGC) {
1126     // fall through
1127   } else if (const RecordType *RecordTy = Ty->getAs<RecordType>()) {
1128     RecordDecl *Record = RecordTy->getDecl();
1129     if (Record->hasObjectMember()) {
1130       CharUnits size = TypeInfo.first;
1131       llvm::Type *SizeTy = ConvertType(getContext().getSizeType());
1132       llvm::Value *SizeVal = llvm::ConstantInt::get(SizeTy, size.getQuantity());
1133       CGM.getObjCRuntime().EmitGCMemmoveCollectable(*this, DestPtr, SrcPtr,
1134                                                     SizeVal);
1135       return;
1136     }
1137   } else if (Ty->isArrayType()) {
1138     QualType BaseType = getContext().getBaseElementType(Ty);
1139     if (const RecordType *RecordTy = BaseType->getAs<RecordType>()) {
1140       if (RecordTy->getDecl()->hasObjectMember()) {
1141         CharUnits size = TypeInfo.first;
1142         llvm::Type *SizeTy = ConvertType(getContext().getSizeType());
1143         llvm::Value *SizeVal =
1144           llvm::ConstantInt::get(SizeTy, size.getQuantity());
1145         CGM.getObjCRuntime().EmitGCMemmoveCollectable(*this, DestPtr, SrcPtr,
1146                                                       SizeVal);
1147         return;
1148       }
1149     }
1150   }
1151 
1152   Builder.CreateMemCpy(DestPtr, SrcPtr,
1153                        llvm::ConstantInt::get(IntPtrTy,
1154                                               TypeInfo.first.getQuantity()),
1155                        TypeInfo.second.getQuantity(), isVolatile);
1156 }
1157