1 //===--- CGBlocks.cpp - Emit LLVM Code for declarations -------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This contains code to emit blocks.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "CGBlocks.h"
15 #include "CGDebugInfo.h"
16 #include "CGObjCRuntime.h"
17 #include "CodeGenFunction.h"
18 #include "CodeGenModule.h"
19 #include "clang/AST/DeclObjC.h"
20 #include "llvm/ADT/SmallSet.h"
21 #include "llvm/IR/DataLayout.h"
22 #include "llvm/IR/Module.h"
23 #include "llvm/Support/CallSite.h"
24 #include <algorithm>
25 #include <cstdio>
26 
27 using namespace clang;
28 using namespace CodeGen;
29 
30 CGBlockInfo::CGBlockInfo(const BlockDecl *block, StringRef name)
31   : Name(name), CXXThisIndex(0), CanBeGlobal(false), NeedsCopyDispose(false),
32     HasCXXObject(false), UsesStret(false), HasCapturedVariableLayout(false),
33     StructureType(0), Block(block),
34     DominatingIP(0) {
35 
36   // Skip asm prefix, if any.  'name' is usually taken directly from
37   // the mangled name of the enclosing function.
38   if (!name.empty() && name[0] == '\01')
39     name = name.substr(1);
40 }
41 
42 // Anchor the vtable to this translation unit.
43 CodeGenModule::ByrefHelpers::~ByrefHelpers() {}
44 
45 /// Build the given block as a global block.
46 static llvm::Constant *buildGlobalBlock(CodeGenModule &CGM,
47                                         const CGBlockInfo &blockInfo,
48                                         llvm::Constant *blockFn);
49 
50 /// Build the helper function to copy a block.
51 static llvm::Constant *buildCopyHelper(CodeGenModule &CGM,
52                                        const CGBlockInfo &blockInfo) {
53   return CodeGenFunction(CGM).GenerateCopyHelperFunction(blockInfo);
54 }
55 
56 /// Build the helper function to dipose of a block.
57 static llvm::Constant *buildDisposeHelper(CodeGenModule &CGM,
58                                           const CGBlockInfo &blockInfo) {
59   return CodeGenFunction(CGM).GenerateDestroyHelperFunction(blockInfo);
60 }
61 
62 /// buildBlockDescriptor - Build the block descriptor meta-data for a block.
63 /// buildBlockDescriptor is accessed from 5th field of the Block_literal
64 /// meta-data and contains stationary information about the block literal.
65 /// Its definition will have 4 (or optinally 6) words.
66 /// struct Block_descriptor {
67 ///   unsigned long reserved;
68 ///   unsigned long size;  // size of Block_literal metadata in bytes.
69 ///   void *copy_func_helper_decl;  // optional copy helper.
70 ///   void *destroy_func_decl; // optioanl destructor helper.
71 ///   void *block_method_encoding_address;//@encode for block literal signature.
72 ///   void *block_layout_info; // encoding of captured block variables.
73 /// };
74 static llvm::Constant *buildBlockDescriptor(CodeGenModule &CGM,
75                                             const CGBlockInfo &blockInfo) {
76   ASTContext &C = CGM.getContext();
77 
78   llvm::Type *ulong = CGM.getTypes().ConvertType(C.UnsignedLongTy);
79   llvm::Type *i8p = CGM.getTypes().ConvertType(C.VoidPtrTy);
80 
81   SmallVector<llvm::Constant*, 6> elements;
82 
83   // reserved
84   elements.push_back(llvm::ConstantInt::get(ulong, 0));
85 
86   // Size
87   // FIXME: What is the right way to say this doesn't fit?  We should give
88   // a user diagnostic in that case.  Better fix would be to change the
89   // API to size_t.
90   elements.push_back(llvm::ConstantInt::get(ulong,
91                                             blockInfo.BlockSize.getQuantity()));
92 
93   // Optional copy/dispose helpers.
94   if (blockInfo.NeedsCopyDispose) {
95     // copy_func_helper_decl
96     elements.push_back(buildCopyHelper(CGM, blockInfo));
97 
98     // destroy_func_decl
99     elements.push_back(buildDisposeHelper(CGM, blockInfo));
100   }
101 
102   // Signature.  Mandatory ObjC-style method descriptor @encode sequence.
103   std::string typeAtEncoding =
104     CGM.getContext().getObjCEncodingForBlock(blockInfo.getBlockExpr());
105   elements.push_back(llvm::ConstantExpr::getBitCast(
106                           CGM.GetAddrOfConstantCString(typeAtEncoding), i8p));
107 
108   // GC layout.
109   if (C.getLangOpts().ObjC1) {
110     if (CGM.getLangOpts().getGC() != LangOptions::NonGC)
111       elements.push_back(CGM.getObjCRuntime().BuildGCBlockLayout(CGM, blockInfo));
112     else
113       elements.push_back(CGM.getObjCRuntime().BuildRCBlockLayout(CGM, blockInfo));
114   }
115   else
116     elements.push_back(llvm::Constant::getNullValue(i8p));
117 
118   llvm::Constant *init = llvm::ConstantStruct::getAnon(elements);
119 
120   llvm::GlobalVariable *global =
121     new llvm::GlobalVariable(CGM.getModule(), init->getType(), true,
122                              llvm::GlobalValue::InternalLinkage,
123                              init, "__block_descriptor_tmp");
124 
125   return llvm::ConstantExpr::getBitCast(global, CGM.getBlockDescriptorType());
126 }
127 
128 /*
129   Purely notional variadic template describing the layout of a block.
130 
131   template <class _ResultType, class... _ParamTypes, class... _CaptureTypes>
132   struct Block_literal {
133     /// Initialized to one of:
134     ///   extern void *_NSConcreteStackBlock[];
135     ///   extern void *_NSConcreteGlobalBlock[];
136     ///
137     /// In theory, we could start one off malloc'ed by setting
138     /// BLOCK_NEEDS_FREE, giving it a refcount of 1, and using
139     /// this isa:
140     ///   extern void *_NSConcreteMallocBlock[];
141     struct objc_class *isa;
142 
143     /// These are the flags (with corresponding bit number) that the
144     /// compiler is actually supposed to know about.
145     ///  25. BLOCK_HAS_COPY_DISPOSE - indicates that the block
146     ///   descriptor provides copy and dispose helper functions
147     ///  26. BLOCK_HAS_CXX_OBJ - indicates that there's a captured
148     ///   object with a nontrivial destructor or copy constructor
149     ///  28. BLOCK_IS_GLOBAL - indicates that the block is allocated
150     ///   as global memory
151     ///  29. BLOCK_USE_STRET - indicates that the block function
152     ///   uses stret, which objc_msgSend needs to know about
153     ///  30. BLOCK_HAS_SIGNATURE - indicates that the block has an
154     ///   @encoded signature string
155     /// And we're not supposed to manipulate these:
156     ///  24. BLOCK_NEEDS_FREE - indicates that the block has been moved
157     ///   to malloc'ed memory
158     ///  27. BLOCK_IS_GC - indicates that the block has been moved to
159     ///   to GC-allocated memory
160     /// Additionally, the bottom 16 bits are a reference count which
161     /// should be zero on the stack.
162     int flags;
163 
164     /// Reserved;  should be zero-initialized.
165     int reserved;
166 
167     /// Function pointer generated from block literal.
168     _ResultType (*invoke)(Block_literal *, _ParamTypes...);
169 
170     /// Block description metadata generated from block literal.
171     struct Block_descriptor *block_descriptor;
172 
173     /// Captured values follow.
174     _CapturesTypes captures...;
175   };
176  */
177 
178 /// The number of fields in a block header.
179 const unsigned BlockHeaderSize = 5;
180 
181 namespace {
182   /// A chunk of data that we actually have to capture in the block.
183   struct BlockLayoutChunk {
184     CharUnits Alignment;
185     CharUnits Size;
186     Qualifiers::ObjCLifetime Lifetime;
187     const BlockDecl::Capture *Capture; // null for 'this'
188     llvm::Type *Type;
189 
190     BlockLayoutChunk(CharUnits align, CharUnits size,
191                      Qualifiers::ObjCLifetime lifetime,
192                      const BlockDecl::Capture *capture,
193                      llvm::Type *type)
194       : Alignment(align), Size(size), Lifetime(lifetime),
195         Capture(capture), Type(type) {}
196 
197     /// Tell the block info that this chunk has the given field index.
198     void setIndex(CGBlockInfo &info, unsigned index) {
199       if (!Capture)
200         info.CXXThisIndex = index;
201       else
202         info.Captures[Capture->getVariable()]
203           = CGBlockInfo::Capture::makeIndex(index);
204     }
205   };
206 
207   /// Order by 1) all __strong together 2) next, all byfref together 3) next,
208   /// all __weak together. Preserve descending alignment in all situations.
209   bool operator<(const BlockLayoutChunk &left, const BlockLayoutChunk &right) {
210     CharUnits LeftValue, RightValue;
211     bool LeftByref = left.Capture ? left.Capture->isByRef() : false;
212     bool RightByref = right.Capture ? right.Capture->isByRef() : false;
213 
214     if (left.Lifetime == Qualifiers::OCL_Strong &&
215         left.Alignment >= right.Alignment)
216       LeftValue = CharUnits::fromQuantity(64);
217     else if (LeftByref && left.Alignment >= right.Alignment)
218       LeftValue = CharUnits::fromQuantity(32);
219     else if (left.Lifetime == Qualifiers::OCL_Weak &&
220              left.Alignment >= right.Alignment)
221       LeftValue = CharUnits::fromQuantity(16);
222     else
223       LeftValue = left.Alignment;
224     if (right.Lifetime == Qualifiers::OCL_Strong &&
225         right.Alignment >= left.Alignment)
226       RightValue = CharUnits::fromQuantity(64);
227     else if (RightByref && right.Alignment >= left.Alignment)
228       RightValue = CharUnits::fromQuantity(32);
229     else if (right.Lifetime == Qualifiers::OCL_Weak &&
230              right.Alignment >= left.Alignment)
231       RightValue = CharUnits::fromQuantity(16);
232     else
233       RightValue = right.Alignment;
234 
235       return LeftValue > RightValue;
236   }
237 }
238 
239 /// Determines if the given type is safe for constant capture in C++.
240 static bool isSafeForCXXConstantCapture(QualType type) {
241   const RecordType *recordType =
242     type->getBaseElementTypeUnsafe()->getAs<RecordType>();
243 
244   // Only records can be unsafe.
245   if (!recordType) return true;
246 
247   const CXXRecordDecl *record = cast<CXXRecordDecl>(recordType->getDecl());
248 
249   // Maintain semantics for classes with non-trivial dtors or copy ctors.
250   if (!record->hasTrivialDestructor()) return false;
251   if (record->hasNonTrivialCopyConstructor()) return false;
252 
253   // Otherwise, we just have to make sure there aren't any mutable
254   // fields that might have changed since initialization.
255   return !record->hasMutableFields();
256 }
257 
258 /// It is illegal to modify a const object after initialization.
259 /// Therefore, if a const object has a constant initializer, we don't
260 /// actually need to keep storage for it in the block; we'll just
261 /// rematerialize it at the start of the block function.  This is
262 /// acceptable because we make no promises about address stability of
263 /// captured variables.
264 static llvm::Constant *tryCaptureAsConstant(CodeGenModule &CGM,
265                                             CodeGenFunction *CGF,
266                                             const VarDecl *var) {
267   QualType type = var->getType();
268 
269   // We can only do this if the variable is const.
270   if (!type.isConstQualified()) return 0;
271 
272   // Furthermore, in C++ we have to worry about mutable fields:
273   // C++ [dcl.type.cv]p4:
274   //   Except that any class member declared mutable can be
275   //   modified, any attempt to modify a const object during its
276   //   lifetime results in undefined behavior.
277   if (CGM.getLangOpts().CPlusPlus && !isSafeForCXXConstantCapture(type))
278     return 0;
279 
280   // If the variable doesn't have any initializer (shouldn't this be
281   // invalid?), it's not clear what we should do.  Maybe capture as
282   // zero?
283   const Expr *init = var->getInit();
284   if (!init) return 0;
285 
286   return CGM.EmitConstantInit(*var, CGF);
287 }
288 
289 /// Get the low bit of a nonzero character count.  This is the
290 /// alignment of the nth byte if the 0th byte is universally aligned.
291 static CharUnits getLowBit(CharUnits v) {
292   return CharUnits::fromQuantity(v.getQuantity() & (~v.getQuantity() + 1));
293 }
294 
295 static void initializeForBlockHeader(CodeGenModule &CGM, CGBlockInfo &info,
296                              SmallVectorImpl<llvm::Type*> &elementTypes) {
297   ASTContext &C = CGM.getContext();
298 
299   // The header is basically a 'struct { void *; int; int; void *; void *; }'.
300   CharUnits ptrSize, ptrAlign, intSize, intAlign;
301   llvm::tie(ptrSize, ptrAlign) = C.getTypeInfoInChars(C.VoidPtrTy);
302   llvm::tie(intSize, intAlign) = C.getTypeInfoInChars(C.IntTy);
303 
304   // Are there crazy embedded platforms where this isn't true?
305   assert(intSize <= ptrSize && "layout assumptions horribly violated");
306 
307   CharUnits headerSize = ptrSize;
308   if (2 * intSize < ptrAlign) headerSize += ptrSize;
309   else headerSize += 2 * intSize;
310   headerSize += 2 * ptrSize;
311 
312   info.BlockAlign = ptrAlign;
313   info.BlockSize = headerSize;
314 
315   assert(elementTypes.empty());
316   llvm::Type *i8p = CGM.getTypes().ConvertType(C.VoidPtrTy);
317   llvm::Type *intTy = CGM.getTypes().ConvertType(C.IntTy);
318   elementTypes.push_back(i8p);
319   elementTypes.push_back(intTy);
320   elementTypes.push_back(intTy);
321   elementTypes.push_back(i8p);
322   elementTypes.push_back(CGM.getBlockDescriptorType());
323 
324   assert(elementTypes.size() == BlockHeaderSize);
325 }
326 
327 /// Compute the layout of the given block.  Attempts to lay the block
328 /// out with minimal space requirements.
329 static void computeBlockInfo(CodeGenModule &CGM, CodeGenFunction *CGF,
330                              CGBlockInfo &info) {
331   ASTContext &C = CGM.getContext();
332   const BlockDecl *block = info.getBlockDecl();
333 
334   SmallVector<llvm::Type*, 8> elementTypes;
335   initializeForBlockHeader(CGM, info, elementTypes);
336 
337   if (!block->hasCaptures()) {
338     info.StructureType =
339       llvm::StructType::get(CGM.getLLVMContext(), elementTypes, true);
340     info.CanBeGlobal = true;
341     return;
342   }
343   else if (C.getLangOpts().ObjC1 &&
344            CGM.getLangOpts().getGC() == LangOptions::NonGC)
345     info.HasCapturedVariableLayout = true;
346 
347   // Collect the layout chunks.
348   SmallVector<BlockLayoutChunk, 16> layout;
349   layout.reserve(block->capturesCXXThis() +
350                  (block->capture_end() - block->capture_begin()));
351 
352   CharUnits maxFieldAlign;
353 
354   // First, 'this'.
355   if (block->capturesCXXThis()) {
356     const DeclContext *DC = block->getDeclContext();
357     for (; isa<BlockDecl>(DC); DC = cast<BlockDecl>(DC)->getDeclContext())
358       ;
359     QualType thisType;
360     if (const CXXRecordDecl *RD = dyn_cast<CXXRecordDecl>(DC))
361       thisType = C.getPointerType(C.getRecordType(RD));
362     else
363       thisType = cast<CXXMethodDecl>(DC)->getThisType(C);
364 
365     llvm::Type *llvmType = CGM.getTypes().ConvertType(thisType);
366     std::pair<CharUnits,CharUnits> tinfo
367       = CGM.getContext().getTypeInfoInChars(thisType);
368     maxFieldAlign = std::max(maxFieldAlign, tinfo.second);
369 
370     layout.push_back(BlockLayoutChunk(tinfo.second, tinfo.first,
371                                       Qualifiers::OCL_None,
372                                       0, llvmType));
373   }
374 
375   // Next, all the block captures.
376   for (BlockDecl::capture_const_iterator ci = block->capture_begin(),
377          ce = block->capture_end(); ci != ce; ++ci) {
378     const VarDecl *variable = ci->getVariable();
379 
380     if (ci->isByRef()) {
381       // We have to copy/dispose of the __block reference.
382       info.NeedsCopyDispose = true;
383 
384       // Just use void* instead of a pointer to the byref type.
385       QualType byRefPtrTy = C.VoidPtrTy;
386 
387       llvm::Type *llvmType = CGM.getTypes().ConvertType(byRefPtrTy);
388       std::pair<CharUnits,CharUnits> tinfo
389         = CGM.getContext().getTypeInfoInChars(byRefPtrTy);
390       maxFieldAlign = std::max(maxFieldAlign, tinfo.second);
391 
392       layout.push_back(BlockLayoutChunk(tinfo.second, tinfo.first,
393                                         Qualifiers::OCL_None,
394                                         &*ci, llvmType));
395       continue;
396     }
397 
398     // Otherwise, build a layout chunk with the size and alignment of
399     // the declaration.
400     if (llvm::Constant *constant = tryCaptureAsConstant(CGM, CGF, variable)) {
401       info.Captures[variable] = CGBlockInfo::Capture::makeConstant(constant);
402       continue;
403     }
404 
405     // If we have a lifetime qualifier, honor it for capture purposes.
406     // That includes *not* copying it if it's __unsafe_unretained.
407     Qualifiers::ObjCLifetime lifetime =
408       variable->getType().getObjCLifetime();
409     if (lifetime) {
410       switch (lifetime) {
411       case Qualifiers::OCL_None: llvm_unreachable("impossible");
412       case Qualifiers::OCL_ExplicitNone:
413       case Qualifiers::OCL_Autoreleasing:
414         break;
415 
416       case Qualifiers::OCL_Strong:
417       case Qualifiers::OCL_Weak:
418         info.NeedsCopyDispose = true;
419       }
420 
421     // Block pointers require copy/dispose.  So do Objective-C pointers.
422     } else if (variable->getType()->isObjCRetainableType()) {
423       info.NeedsCopyDispose = true;
424       // used for mrr below.
425       lifetime = Qualifiers::OCL_Strong;
426 
427     // So do types that require non-trivial copy construction.
428     } else if (ci->hasCopyExpr()) {
429       info.NeedsCopyDispose = true;
430       info.HasCXXObject = true;
431 
432     // And so do types with destructors.
433     } else if (CGM.getLangOpts().CPlusPlus) {
434       if (const CXXRecordDecl *record =
435             variable->getType()->getAsCXXRecordDecl()) {
436         if (!record->hasTrivialDestructor()) {
437           info.HasCXXObject = true;
438           info.NeedsCopyDispose = true;
439         }
440       }
441     }
442 
443     QualType VT = variable->getType();
444     CharUnits size = C.getTypeSizeInChars(VT);
445     CharUnits align = C.getDeclAlign(variable);
446 
447     maxFieldAlign = std::max(maxFieldAlign, align);
448 
449     llvm::Type *llvmType =
450       CGM.getTypes().ConvertTypeForMem(VT);
451 
452     layout.push_back(BlockLayoutChunk(align, size, lifetime, &*ci, llvmType));
453   }
454 
455   // If that was everything, we're done here.
456   if (layout.empty()) {
457     info.StructureType =
458       llvm::StructType::get(CGM.getLLVMContext(), elementTypes, true);
459     info.CanBeGlobal = true;
460     return;
461   }
462 
463   // Sort the layout by alignment.  We have to use a stable sort here
464   // to get reproducible results.  There should probably be an
465   // llvm::array_pod_stable_sort.
466   std::stable_sort(layout.begin(), layout.end());
467 
468   // Needed for blocks layout info.
469   info.BlockHeaderForcedGapOffset = info.BlockSize;
470   info.BlockHeaderForcedGapSize = CharUnits::Zero();
471 
472   CharUnits &blockSize = info.BlockSize;
473   info.BlockAlign = std::max(maxFieldAlign, info.BlockAlign);
474 
475   // Assuming that the first byte in the header is maximally aligned,
476   // get the alignment of the first byte following the header.
477   CharUnits endAlign = getLowBit(blockSize);
478 
479   // If the end of the header isn't satisfactorily aligned for the
480   // maximum thing, look for things that are okay with the header-end
481   // alignment, and keep appending them until we get something that's
482   // aligned right.  This algorithm is only guaranteed optimal if
483   // that condition is satisfied at some point; otherwise we can get
484   // things like:
485   //   header                 // next byte has alignment 4
486   //   something_with_size_5; // next byte has alignment 1
487   //   something_with_alignment_8;
488   // which has 7 bytes of padding, as opposed to the naive solution
489   // which might have less (?).
490   if (endAlign < maxFieldAlign) {
491     SmallVectorImpl<BlockLayoutChunk>::iterator
492       li = layout.begin() + 1, le = layout.end();
493 
494     // Look for something that the header end is already
495     // satisfactorily aligned for.
496     for (; li != le && endAlign < li->Alignment; ++li)
497       ;
498 
499     // If we found something that's naturally aligned for the end of
500     // the header, keep adding things...
501     if (li != le) {
502       SmallVectorImpl<BlockLayoutChunk>::iterator first = li;
503       for (; li != le; ++li) {
504         assert(endAlign >= li->Alignment);
505 
506         li->setIndex(info, elementTypes.size());
507         elementTypes.push_back(li->Type);
508         blockSize += li->Size;
509         endAlign = getLowBit(blockSize);
510 
511         // ...until we get to the alignment of the maximum field.
512         if (endAlign >= maxFieldAlign) {
513           if (li == first) {
514             // No user field was appended. So, a gap was added.
515             // Save total gap size for use in block layout bit map.
516             info.BlockHeaderForcedGapSize = li->Size;
517           }
518           break;
519         }
520       }
521       // Don't re-append everything we just appended.
522       layout.erase(first, li);
523     }
524   }
525 
526   assert(endAlign == getLowBit(blockSize));
527 
528   // At this point, we just have to add padding if the end align still
529   // isn't aligned right.
530   if (endAlign < maxFieldAlign) {
531     CharUnits newBlockSize = blockSize.RoundUpToAlignment(maxFieldAlign);
532     CharUnits padding = newBlockSize - blockSize;
533 
534     elementTypes.push_back(llvm::ArrayType::get(CGM.Int8Ty,
535                                                 padding.getQuantity()));
536     blockSize = newBlockSize;
537     endAlign = getLowBit(blockSize); // might be > maxFieldAlign
538   }
539 
540   assert(endAlign >= maxFieldAlign);
541   assert(endAlign == getLowBit(blockSize));
542   // Slam everything else on now.  This works because they have
543   // strictly decreasing alignment and we expect that size is always a
544   // multiple of alignment.
545   for (SmallVectorImpl<BlockLayoutChunk>::iterator
546          li = layout.begin(), le = layout.end(); li != le; ++li) {
547     assert(endAlign >= li->Alignment);
548     li->setIndex(info, elementTypes.size());
549     elementTypes.push_back(li->Type);
550     blockSize += li->Size;
551     endAlign = getLowBit(blockSize);
552   }
553 
554   info.StructureType =
555     llvm::StructType::get(CGM.getLLVMContext(), elementTypes, true);
556 }
557 
558 /// Enter the scope of a block.  This should be run at the entrance to
559 /// a full-expression so that the block's cleanups are pushed at the
560 /// right place in the stack.
561 static void enterBlockScope(CodeGenFunction &CGF, BlockDecl *block) {
562   assert(CGF.HaveInsertPoint());
563 
564   // Allocate the block info and place it at the head of the list.
565   CGBlockInfo &blockInfo =
566     *new CGBlockInfo(block, CGF.CurFn->getName());
567   blockInfo.NextBlockInfo = CGF.FirstBlockInfo;
568   CGF.FirstBlockInfo = &blockInfo;
569 
570   // Compute information about the layout, etc., of this block,
571   // pushing cleanups as necessary.
572   computeBlockInfo(CGF.CGM, &CGF, blockInfo);
573 
574   // Nothing else to do if it can be global.
575   if (blockInfo.CanBeGlobal) return;
576 
577   // Make the allocation for the block.
578   blockInfo.Address =
579     CGF.CreateTempAlloca(blockInfo.StructureType, "block");
580   blockInfo.Address->setAlignment(blockInfo.BlockAlign.getQuantity());
581 
582   // If there are cleanups to emit, enter them (but inactive).
583   if (!blockInfo.NeedsCopyDispose) return;
584 
585   // Walk through the captures (in order) and find the ones not
586   // captured by constant.
587   for (BlockDecl::capture_const_iterator ci = block->capture_begin(),
588          ce = block->capture_end(); ci != ce; ++ci) {
589     // Ignore __block captures; there's nothing special in the
590     // on-stack block that we need to do for them.
591     if (ci->isByRef()) continue;
592 
593     // Ignore variables that are constant-captured.
594     const VarDecl *variable = ci->getVariable();
595     CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
596     if (capture.isConstant()) continue;
597 
598     // Ignore objects that aren't destructed.
599     QualType::DestructionKind dtorKind =
600       variable->getType().isDestructedType();
601     if (dtorKind == QualType::DK_none) continue;
602 
603     CodeGenFunction::Destroyer *destroyer;
604 
605     // Block captures count as local values and have imprecise semantics.
606     // They also can't be arrays, so need to worry about that.
607     if (dtorKind == QualType::DK_objc_strong_lifetime) {
608       destroyer = CodeGenFunction::destroyARCStrongImprecise;
609     } else {
610       destroyer = CGF.getDestroyer(dtorKind);
611     }
612 
613     // GEP down to the address.
614     llvm::Value *addr = CGF.Builder.CreateStructGEP(blockInfo.Address,
615                                                     capture.getIndex());
616 
617     // We can use that GEP as the dominating IP.
618     if (!blockInfo.DominatingIP)
619       blockInfo.DominatingIP = cast<llvm::Instruction>(addr);
620 
621     CleanupKind cleanupKind = InactiveNormalCleanup;
622     bool useArrayEHCleanup = CGF.needsEHCleanup(dtorKind);
623     if (useArrayEHCleanup)
624       cleanupKind = InactiveNormalAndEHCleanup;
625 
626     CGF.pushDestroy(cleanupKind, addr, variable->getType(),
627                     destroyer, useArrayEHCleanup);
628 
629     // Remember where that cleanup was.
630     capture.setCleanup(CGF.EHStack.stable_begin());
631   }
632 }
633 
634 /// Enter a full-expression with a non-trivial number of objects to
635 /// clean up.  This is in this file because, at the moment, the only
636 /// kind of cleanup object is a BlockDecl*.
637 void CodeGenFunction::enterNonTrivialFullExpression(const ExprWithCleanups *E) {
638   assert(E->getNumObjects() != 0);
639   ArrayRef<ExprWithCleanups::CleanupObject> cleanups = E->getObjects();
640   for (ArrayRef<ExprWithCleanups::CleanupObject>::iterator
641          i = cleanups.begin(), e = cleanups.end(); i != e; ++i) {
642     enterBlockScope(*this, *i);
643   }
644 }
645 
646 /// Find the layout for the given block in a linked list and remove it.
647 static CGBlockInfo *findAndRemoveBlockInfo(CGBlockInfo **head,
648                                            const BlockDecl *block) {
649   while (true) {
650     assert(head && *head);
651     CGBlockInfo *cur = *head;
652 
653     // If this is the block we're looking for, splice it out of the list.
654     if (cur->getBlockDecl() == block) {
655       *head = cur->NextBlockInfo;
656       return cur;
657     }
658 
659     head = &cur->NextBlockInfo;
660   }
661 }
662 
663 /// Destroy a chain of block layouts.
664 void CodeGenFunction::destroyBlockInfos(CGBlockInfo *head) {
665   assert(head && "destroying an empty chain");
666   do {
667     CGBlockInfo *cur = head;
668     head = cur->NextBlockInfo;
669     delete cur;
670   } while (head != 0);
671 }
672 
673 /// Emit a block literal expression in the current function.
674 llvm::Value *CodeGenFunction::EmitBlockLiteral(const BlockExpr *blockExpr) {
675   // If the block has no captures, we won't have a pre-computed
676   // layout for it.
677   if (!blockExpr->getBlockDecl()->hasCaptures()) {
678     CGBlockInfo blockInfo(blockExpr->getBlockDecl(), CurFn->getName());
679     computeBlockInfo(CGM, this, blockInfo);
680     blockInfo.BlockExpression = blockExpr;
681     return EmitBlockLiteral(blockInfo);
682   }
683 
684   // Find the block info for this block and take ownership of it.
685   OwningPtr<CGBlockInfo> blockInfo;
686   blockInfo.reset(findAndRemoveBlockInfo(&FirstBlockInfo,
687                                          blockExpr->getBlockDecl()));
688 
689   blockInfo->BlockExpression = blockExpr;
690   return EmitBlockLiteral(*blockInfo);
691 }
692 
693 llvm::Value *CodeGenFunction::EmitBlockLiteral(const CGBlockInfo &blockInfo) {
694   // Using the computed layout, generate the actual block function.
695   bool isLambdaConv = blockInfo.getBlockDecl()->isConversionFromLambda();
696   llvm::Constant *blockFn
697     = CodeGenFunction(CGM, true).GenerateBlockFunction(CurGD, blockInfo,
698                                                  CurFuncDecl, LocalDeclMap,
699                                                  isLambdaConv);
700   blockFn = llvm::ConstantExpr::getBitCast(blockFn, VoidPtrTy);
701 
702   // If there is nothing to capture, we can emit this as a global block.
703   if (blockInfo.CanBeGlobal)
704     return buildGlobalBlock(CGM, blockInfo, blockFn);
705 
706   // Otherwise, we have to emit this as a local block.
707 
708   llvm::Constant *isa = CGM.getNSConcreteStackBlock();
709   isa = llvm::ConstantExpr::getBitCast(isa, VoidPtrTy);
710 
711   // Build the block descriptor.
712   llvm::Constant *descriptor = buildBlockDescriptor(CGM, blockInfo);
713 
714   llvm::AllocaInst *blockAddr = blockInfo.Address;
715   assert(blockAddr && "block has no address!");
716 
717   // Compute the initial on-stack block flags.
718   BlockFlags flags = BLOCK_HAS_SIGNATURE;
719   if (blockInfo.HasCapturedVariableLayout) flags |= BLOCK_HAS_EXTENDED_LAYOUT;
720   if (blockInfo.NeedsCopyDispose) flags |= BLOCK_HAS_COPY_DISPOSE;
721   if (blockInfo.HasCXXObject) flags |= BLOCK_HAS_CXX_OBJ;
722   if (blockInfo.UsesStret) flags |= BLOCK_USE_STRET;
723 
724   // Initialize the block literal.
725   Builder.CreateStore(isa, Builder.CreateStructGEP(blockAddr, 0, "block.isa"));
726   Builder.CreateStore(llvm::ConstantInt::get(IntTy, flags.getBitMask()),
727                       Builder.CreateStructGEP(blockAddr, 1, "block.flags"));
728   Builder.CreateStore(llvm::ConstantInt::get(IntTy, 0),
729                       Builder.CreateStructGEP(blockAddr, 2, "block.reserved"));
730   Builder.CreateStore(blockFn, Builder.CreateStructGEP(blockAddr, 3,
731                                                        "block.invoke"));
732   Builder.CreateStore(descriptor, Builder.CreateStructGEP(blockAddr, 4,
733                                                           "block.descriptor"));
734 
735   // Finally, capture all the values into the block.
736   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
737 
738   // First, 'this'.
739   if (blockDecl->capturesCXXThis()) {
740     llvm::Value *addr = Builder.CreateStructGEP(blockAddr,
741                                                 blockInfo.CXXThisIndex,
742                                                 "block.captured-this.addr");
743     Builder.CreateStore(LoadCXXThis(), addr);
744   }
745 
746   // Next, captured variables.
747   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
748          ce = blockDecl->capture_end(); ci != ce; ++ci) {
749     const VarDecl *variable = ci->getVariable();
750     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
751 
752     // Ignore constant captures.
753     if (capture.isConstant()) continue;
754 
755     QualType type = variable->getType();
756     CharUnits align = getContext().getDeclAlign(variable);
757 
758     // This will be a [[type]]*, except that a byref entry will just be
759     // an i8**.
760     llvm::Value *blockField =
761       Builder.CreateStructGEP(blockAddr, capture.getIndex(),
762                               "block.captured");
763 
764     // Compute the address of the thing we're going to move into the
765     // block literal.
766     llvm::Value *src;
767     if (BlockInfo && ci->isNested()) {
768       // We need to use the capture from the enclosing block.
769       const CGBlockInfo::Capture &enclosingCapture =
770         BlockInfo->getCapture(variable);
771 
772       // This is a [[type]]*, except that a byref entry wil just be an i8**.
773       src = Builder.CreateStructGEP(LoadBlockStruct(),
774                                     enclosingCapture.getIndex(),
775                                     "block.capture.addr");
776     } else if (blockDecl->isConversionFromLambda()) {
777       // The lambda capture in a lambda's conversion-to-block-pointer is
778       // special; we'll simply emit it directly.
779       src = 0;
780     } else {
781       // Just look it up in the locals map, which will give us back a
782       // [[type]]*.  If that doesn't work, do the more elaborate DRE
783       // emission.
784       src = LocalDeclMap.lookup(variable);
785       if (!src) {
786         DeclRefExpr declRef(const_cast<VarDecl*>(variable),
787                             /*refersToEnclosing*/ ci->isNested(), type,
788                             VK_LValue, SourceLocation());
789         src = EmitDeclRefLValue(&declRef).getAddress();
790       }
791     }
792 
793     // For byrefs, we just write the pointer to the byref struct into
794     // the block field.  There's no need to chase the forwarding
795     // pointer at this point, since we're building something that will
796     // live a shorter life than the stack byref anyway.
797     if (ci->isByRef()) {
798       // Get a void* that points to the byref struct.
799       if (ci->isNested())
800         src = Builder.CreateAlignedLoad(src, align.getQuantity(),
801                                         "byref.capture");
802       else
803         src = Builder.CreateBitCast(src, VoidPtrTy);
804 
805       // Write that void* into the capture field.
806       Builder.CreateAlignedStore(src, blockField, align.getQuantity());
807 
808     // If we have a copy constructor, evaluate that into the block field.
809     } else if (const Expr *copyExpr = ci->getCopyExpr()) {
810       if (blockDecl->isConversionFromLambda()) {
811         // If we have a lambda conversion, emit the expression
812         // directly into the block instead.
813         AggValueSlot Slot =
814             AggValueSlot::forAddr(blockField, align, Qualifiers(),
815                                   AggValueSlot::IsDestructed,
816                                   AggValueSlot::DoesNotNeedGCBarriers,
817                                   AggValueSlot::IsNotAliased);
818         EmitAggExpr(copyExpr, Slot);
819       } else {
820         EmitSynthesizedCXXCopyCtor(blockField, src, copyExpr);
821       }
822 
823     // If it's a reference variable, copy the reference into the block field.
824     } else if (type->isReferenceType()) {
825       llvm::Value *ref =
826         Builder.CreateAlignedLoad(src, align.getQuantity(), "ref.val");
827       Builder.CreateAlignedStore(ref, blockField, align.getQuantity());
828 
829     // If this is an ARC __strong block-pointer variable, don't do a
830     // block copy.
831     //
832     // TODO: this can be generalized into the normal initialization logic:
833     // we should never need to do a block-copy when initializing a local
834     // variable, because the local variable's lifetime should be strictly
835     // contained within the stack block's.
836     } else if (type.getObjCLifetime() == Qualifiers::OCL_Strong &&
837                type->isBlockPointerType()) {
838       // Load the block and do a simple retain.
839       LValue srcLV = MakeAddrLValue(src, type, align);
840       llvm::Value *value = EmitLoadOfScalar(srcLV);
841       value = EmitARCRetainNonBlock(value);
842 
843       // Do a primitive store to the block field.
844       LValue destLV = MakeAddrLValue(blockField, type, align);
845       EmitStoreOfScalar(value, destLV, /*init*/ true);
846 
847     // Otherwise, fake up a POD copy into the block field.
848     } else {
849       // Fake up a new variable so that EmitScalarInit doesn't think
850       // we're referring to the variable in its own initializer.
851       ImplicitParamDecl blockFieldPseudoVar(/*DC*/ 0, SourceLocation(),
852                                             /*name*/ 0, type);
853 
854       // We use one of these or the other depending on whether the
855       // reference is nested.
856       DeclRefExpr declRef(const_cast<VarDecl*>(variable),
857                           /*refersToEnclosing*/ ci->isNested(), type,
858                           VK_LValue, SourceLocation());
859 
860       ImplicitCastExpr l2r(ImplicitCastExpr::OnStack, type, CK_LValueToRValue,
861                            &declRef, VK_RValue);
862       EmitExprAsInit(&l2r, &blockFieldPseudoVar,
863                      MakeAddrLValue(blockField, type, align),
864                      /*captured by init*/ false);
865     }
866 
867     // Activate the cleanup if layout pushed one.
868     if (!ci->isByRef()) {
869       EHScopeStack::stable_iterator cleanup = capture.getCleanup();
870       if (cleanup.isValid())
871         ActivateCleanupBlock(cleanup, blockInfo.DominatingIP);
872     }
873   }
874 
875   // Cast to the converted block-pointer type, which happens (somewhat
876   // unfortunately) to be a pointer to function type.
877   llvm::Value *result =
878     Builder.CreateBitCast(blockAddr,
879                           ConvertType(blockInfo.getBlockExpr()->getType()));
880 
881   return result;
882 }
883 
884 
885 llvm::Type *CodeGenModule::getBlockDescriptorType() {
886   if (BlockDescriptorType)
887     return BlockDescriptorType;
888 
889   llvm::Type *UnsignedLongTy =
890     getTypes().ConvertType(getContext().UnsignedLongTy);
891 
892   // struct __block_descriptor {
893   //   unsigned long reserved;
894   //   unsigned long block_size;
895   //
896   //   // later, the following will be added
897   //
898   //   struct {
899   //     void (*copyHelper)();
900   //     void (*copyHelper)();
901   //   } helpers;                // !!! optional
902   //
903   //   const char *signature;   // the block signature
904   //   const char *layout;      // reserved
905   // };
906   BlockDescriptorType =
907     llvm::StructType::create("struct.__block_descriptor",
908                              UnsignedLongTy, UnsignedLongTy, NULL);
909 
910   // Now form a pointer to that.
911   BlockDescriptorType = llvm::PointerType::getUnqual(BlockDescriptorType);
912   return BlockDescriptorType;
913 }
914 
915 llvm::Type *CodeGenModule::getGenericBlockLiteralType() {
916   if (GenericBlockLiteralType)
917     return GenericBlockLiteralType;
918 
919   llvm::Type *BlockDescPtrTy = getBlockDescriptorType();
920 
921   // struct __block_literal_generic {
922   //   void *__isa;
923   //   int __flags;
924   //   int __reserved;
925   //   void (*__invoke)(void *);
926   //   struct __block_descriptor *__descriptor;
927   // };
928   GenericBlockLiteralType =
929     llvm::StructType::create("struct.__block_literal_generic",
930                              VoidPtrTy, IntTy, IntTy, VoidPtrTy,
931                              BlockDescPtrTy, NULL);
932 
933   return GenericBlockLiteralType;
934 }
935 
936 
937 RValue CodeGenFunction::EmitBlockCallExpr(const CallExpr* E,
938                                           ReturnValueSlot ReturnValue) {
939   const BlockPointerType *BPT =
940     E->getCallee()->getType()->getAs<BlockPointerType>();
941 
942   llvm::Value *Callee = EmitScalarExpr(E->getCallee());
943 
944   // Get a pointer to the generic block literal.
945   llvm::Type *BlockLiteralTy =
946     llvm::PointerType::getUnqual(CGM.getGenericBlockLiteralType());
947 
948   // Bitcast the callee to a block literal.
949   llvm::Value *BlockLiteral =
950     Builder.CreateBitCast(Callee, BlockLiteralTy, "block.literal");
951 
952   // Get the function pointer from the literal.
953   llvm::Value *FuncPtr = Builder.CreateStructGEP(BlockLiteral, 3);
954 
955   BlockLiteral = Builder.CreateBitCast(BlockLiteral, VoidPtrTy);
956 
957   // Add the block literal.
958   CallArgList Args;
959   Args.add(RValue::get(BlockLiteral), getContext().VoidPtrTy);
960 
961   QualType FnType = BPT->getPointeeType();
962 
963   // And the rest of the arguments.
964   EmitCallArgs(Args, FnType->getAs<FunctionProtoType>(),
965                E->arg_begin(), E->arg_end());
966 
967   // Load the function.
968   llvm::Value *Func = Builder.CreateLoad(FuncPtr);
969 
970   const FunctionType *FuncTy = FnType->castAs<FunctionType>();
971   const CGFunctionInfo &FnInfo =
972     CGM.getTypes().arrangeBlockFunctionCall(Args, FuncTy);
973 
974   // Cast the function pointer to the right type.
975   llvm::Type *BlockFTy = CGM.getTypes().GetFunctionType(FnInfo);
976 
977   llvm::Type *BlockFTyPtr = llvm::PointerType::getUnqual(BlockFTy);
978   Func = Builder.CreateBitCast(Func, BlockFTyPtr);
979 
980   // And call the block.
981   return EmitCall(FnInfo, Func, ReturnValue, Args);
982 }
983 
984 llvm::Value *CodeGenFunction::GetAddrOfBlockDecl(const VarDecl *variable,
985                                                  bool isByRef) {
986   assert(BlockInfo && "evaluating block ref without block information?");
987   const CGBlockInfo::Capture &capture = BlockInfo->getCapture(variable);
988 
989   // Handle constant captures.
990   if (capture.isConstant()) return LocalDeclMap[variable];
991 
992   llvm::Value *addr =
993     Builder.CreateStructGEP(LoadBlockStruct(), capture.getIndex(),
994                             "block.capture.addr");
995 
996   if (isByRef) {
997     // addr should be a void** right now.  Load, then cast the result
998     // to byref*.
999 
1000     addr = Builder.CreateLoad(addr);
1001     llvm::PointerType *byrefPointerType
1002       = llvm::PointerType::get(BuildByRefType(variable), 0);
1003     addr = Builder.CreateBitCast(addr, byrefPointerType,
1004                                  "byref.addr");
1005 
1006     // Follow the forwarding pointer.
1007     addr = Builder.CreateStructGEP(addr, 1, "byref.forwarding");
1008     addr = Builder.CreateLoad(addr, "byref.addr.forwarded");
1009 
1010     // Cast back to byref* and GEP over to the actual object.
1011     addr = Builder.CreateBitCast(addr, byrefPointerType);
1012     addr = Builder.CreateStructGEP(addr, getByRefValueLLVMField(variable),
1013                                    variable->getNameAsString());
1014   }
1015 
1016   if (variable->getType()->isReferenceType())
1017     addr = Builder.CreateLoad(addr, "ref.tmp");
1018 
1019   return addr;
1020 }
1021 
1022 llvm::Constant *
1023 CodeGenModule::GetAddrOfGlobalBlock(const BlockExpr *blockExpr,
1024                                     const char *name) {
1025   CGBlockInfo blockInfo(blockExpr->getBlockDecl(), name);
1026   blockInfo.BlockExpression = blockExpr;
1027 
1028   // Compute information about the layout, etc., of this block.
1029   computeBlockInfo(*this, 0, blockInfo);
1030 
1031   // Using that metadata, generate the actual block function.
1032   llvm::Constant *blockFn;
1033   {
1034     llvm::DenseMap<const Decl*, llvm::Value*> LocalDeclMap;
1035     blockFn = CodeGenFunction(*this).GenerateBlockFunction(GlobalDecl(),
1036                                                            blockInfo,
1037                                                            0, LocalDeclMap,
1038                                                            false);
1039   }
1040   blockFn = llvm::ConstantExpr::getBitCast(blockFn, VoidPtrTy);
1041 
1042   return buildGlobalBlock(*this, blockInfo, blockFn);
1043 }
1044 
1045 static llvm::Constant *buildGlobalBlock(CodeGenModule &CGM,
1046                                         const CGBlockInfo &blockInfo,
1047                                         llvm::Constant *blockFn) {
1048   assert(blockInfo.CanBeGlobal);
1049 
1050   // Generate the constants for the block literal initializer.
1051   llvm::Constant *fields[BlockHeaderSize];
1052 
1053   // isa
1054   fields[0] = CGM.getNSConcreteGlobalBlock();
1055 
1056   // __flags
1057   BlockFlags flags = BLOCK_IS_GLOBAL | BLOCK_HAS_SIGNATURE;
1058   if (blockInfo.UsesStret) flags |= BLOCK_USE_STRET;
1059 
1060   fields[1] = llvm::ConstantInt::get(CGM.IntTy, flags.getBitMask());
1061 
1062   // Reserved
1063   fields[2] = llvm::Constant::getNullValue(CGM.IntTy);
1064 
1065   // Function
1066   fields[3] = blockFn;
1067 
1068   // Descriptor
1069   fields[4] = buildBlockDescriptor(CGM, blockInfo);
1070 
1071   llvm::Constant *init = llvm::ConstantStruct::getAnon(fields);
1072 
1073   llvm::GlobalVariable *literal =
1074     new llvm::GlobalVariable(CGM.getModule(),
1075                              init->getType(),
1076                              /*constant*/ true,
1077                              llvm::GlobalVariable::InternalLinkage,
1078                              init,
1079                              "__block_literal_global");
1080   literal->setAlignment(blockInfo.BlockAlign.getQuantity());
1081 
1082   // Return a constant of the appropriately-casted type.
1083   llvm::Type *requiredType =
1084     CGM.getTypes().ConvertType(blockInfo.getBlockExpr()->getType());
1085   return llvm::ConstantExpr::getBitCast(literal, requiredType);
1086 }
1087 
1088 llvm::Function *
1089 CodeGenFunction::GenerateBlockFunction(GlobalDecl GD,
1090                                        const CGBlockInfo &blockInfo,
1091                                        const Decl *outerFnDecl,
1092                                        const DeclMapTy &ldm,
1093                                        bool IsLambdaConversionToBlock) {
1094   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
1095 
1096   // Check if we should generate debug info for this block function.
1097   maybeInitializeDebugInfo();
1098   CurGD = GD;
1099 
1100   BlockInfo = &blockInfo;
1101 
1102   // Arrange for local static and local extern declarations to appear
1103   // to be local to this function as well, in case they're directly
1104   // referenced in a block.
1105   for (DeclMapTy::const_iterator i = ldm.begin(), e = ldm.end(); i != e; ++i) {
1106     const VarDecl *var = dyn_cast<VarDecl>(i->first);
1107     if (var && !var->hasLocalStorage())
1108       LocalDeclMap[var] = i->second;
1109   }
1110 
1111   // Begin building the function declaration.
1112 
1113   // Build the argument list.
1114   FunctionArgList args;
1115 
1116   // The first argument is the block pointer.  Just take it as a void*
1117   // and cast it later.
1118   QualType selfTy = getContext().VoidPtrTy;
1119   IdentifierInfo *II = &CGM.getContext().Idents.get(".block_descriptor");
1120 
1121   ImplicitParamDecl selfDecl(const_cast<BlockDecl*>(blockDecl),
1122                              SourceLocation(), II, selfTy);
1123   args.push_back(&selfDecl);
1124 
1125   // Now add the rest of the parameters.
1126   for (BlockDecl::param_const_iterator i = blockDecl->param_begin(),
1127        e = blockDecl->param_end(); i != e; ++i)
1128     args.push_back(*i);
1129 
1130   // Create the function declaration.
1131   const FunctionProtoType *fnType = blockInfo.getBlockExpr()->getFunctionType();
1132   const CGFunctionInfo &fnInfo =
1133     CGM.getTypes().arrangeFunctionDeclaration(fnType->getResultType(), args,
1134                                               fnType->getExtInfo(),
1135                                               fnType->isVariadic());
1136   if (CGM.ReturnTypeUsesSRet(fnInfo))
1137     blockInfo.UsesStret = true;
1138 
1139   llvm::FunctionType *fnLLVMType = CGM.getTypes().GetFunctionType(fnInfo);
1140 
1141   MangleBuffer name;
1142   CGM.getBlockMangledName(GD, name, blockDecl);
1143   llvm::Function *fn =
1144     llvm::Function::Create(fnLLVMType, llvm::GlobalValue::InternalLinkage,
1145                            name.getString(), &CGM.getModule());
1146   CGM.SetInternalFunctionAttributes(blockDecl, fn, fnInfo);
1147 
1148   // Begin generating the function.
1149   StartFunction(blockDecl, fnType->getResultType(), fn, fnInfo, args,
1150                 blockInfo.getBlockExpr()->getBody()->getLocStart());
1151   CurFuncDecl = outerFnDecl; // StartFunction sets this to blockDecl
1152 
1153   // Okay.  Undo some of what StartFunction did.
1154 
1155   // Pull the 'self' reference out of the local decl map.
1156   llvm::Value *blockAddr = LocalDeclMap[&selfDecl];
1157   LocalDeclMap.erase(&selfDecl);
1158   BlockPointer = Builder.CreateBitCast(blockAddr,
1159                                        blockInfo.StructureType->getPointerTo(),
1160                                        "block");
1161   // At -O0 we generate an explicit alloca for the BlockPointer, so the RA
1162   // won't delete the dbg.declare intrinsics for captured variables.
1163   llvm::Value *BlockPointerDbgLoc = BlockPointer;
1164   if (CGM.getCodeGenOpts().OptimizationLevel == 0) {
1165     // Allocate a stack slot for it, so we can point the debugger to it
1166     llvm::AllocaInst *Alloca = CreateTempAlloca(BlockPointer->getType(),
1167                                                 "block.addr");
1168     unsigned Align = getContext().getDeclAlign(&selfDecl).getQuantity();
1169     Alloca->setAlignment(Align);
1170     // Set the DebugLocation to empty, so the store is recognized as a
1171     // frame setup instruction by llvm::DwarfDebug::beginFunction().
1172     Builder.DisableDebugLocations();
1173     Builder.CreateAlignedStore(BlockPointer, Alloca, Align);
1174     Builder.EnableDebugLocations();
1175     BlockPointerDbgLoc = Alloca;
1176   }
1177 
1178   // If we have a C++ 'this' reference, go ahead and force it into
1179   // existence now.
1180   if (blockDecl->capturesCXXThis()) {
1181     llvm::Value *addr = Builder.CreateStructGEP(BlockPointer,
1182                                                 blockInfo.CXXThisIndex,
1183                                                 "block.captured-this");
1184     CXXThisValue = Builder.CreateLoad(addr, "this");
1185   }
1186 
1187   // LoadObjCSelf() expects there to be an entry for 'self' in LocalDeclMap;
1188   // appease it.
1189   if (const ObjCMethodDecl *method
1190         = dyn_cast_or_null<ObjCMethodDecl>(CurFuncDecl)) {
1191     const VarDecl *self = method->getSelfDecl();
1192 
1193     // There might not be a capture for 'self', but if there is...
1194     if (blockInfo.Captures.count(self)) {
1195       const CGBlockInfo::Capture &capture = blockInfo.getCapture(self);
1196 
1197       llvm::Value *selfAddr = Builder.CreateStructGEP(BlockPointer,
1198                                                       capture.getIndex(),
1199                                                       "block.captured-self");
1200       LocalDeclMap[self] = selfAddr;
1201     }
1202   }
1203 
1204   // Also force all the constant captures.
1205   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
1206          ce = blockDecl->capture_end(); ci != ce; ++ci) {
1207     const VarDecl *variable = ci->getVariable();
1208     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
1209     if (!capture.isConstant()) continue;
1210 
1211     unsigned align = getContext().getDeclAlign(variable).getQuantity();
1212 
1213     llvm::AllocaInst *alloca =
1214       CreateMemTemp(variable->getType(), "block.captured-const");
1215     alloca->setAlignment(align);
1216 
1217     Builder.CreateAlignedStore(capture.getConstant(), alloca, align);
1218 
1219     LocalDeclMap[variable] = alloca;
1220   }
1221 
1222   // Save a spot to insert the debug information for all the DeclRefExprs.
1223   llvm::BasicBlock *entry = Builder.GetInsertBlock();
1224   llvm::BasicBlock::iterator entry_ptr = Builder.GetInsertPoint();
1225   --entry_ptr;
1226 
1227   if (IsLambdaConversionToBlock)
1228     EmitLambdaBlockInvokeBody();
1229   else
1230     EmitStmt(blockDecl->getBody());
1231 
1232   // Remember where we were...
1233   llvm::BasicBlock *resume = Builder.GetInsertBlock();
1234 
1235   // Go back to the entry.
1236   ++entry_ptr;
1237   Builder.SetInsertPoint(entry, entry_ptr);
1238 
1239   // Emit debug information for all the DeclRefExprs.
1240   // FIXME: also for 'this'
1241   if (CGDebugInfo *DI = getDebugInfo()) {
1242     for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
1243            ce = blockDecl->capture_end(); ci != ce; ++ci) {
1244       const VarDecl *variable = ci->getVariable();
1245       DI->EmitLocation(Builder, variable->getLocation());
1246 
1247       if (CGM.getCodeGenOpts().getDebugInfo()
1248             >= CodeGenOptions::LimitedDebugInfo) {
1249         const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
1250         if (capture.isConstant()) {
1251           DI->EmitDeclareOfAutoVariable(variable, LocalDeclMap[variable],
1252                                         Builder);
1253           continue;
1254         }
1255 
1256         DI->EmitDeclareOfBlockDeclRefVariable(variable, BlockPointerDbgLoc,
1257                                               Builder, blockInfo);
1258       }
1259     }
1260     // Recover location if it was changed in the above loop.
1261     DI->EmitLocation(Builder,
1262                      cast<CompoundStmt>(blockDecl->getBody())->getRBracLoc());
1263   }
1264 
1265   // And resume where we left off.
1266   if (resume == 0)
1267     Builder.ClearInsertionPoint();
1268   else
1269     Builder.SetInsertPoint(resume);
1270 
1271   FinishFunction(cast<CompoundStmt>(blockDecl->getBody())->getRBracLoc());
1272 
1273   return fn;
1274 }
1275 
1276 /*
1277     notes.push_back(HelperInfo());
1278     HelperInfo &note = notes.back();
1279     note.index = capture.getIndex();
1280     note.RequiresCopying = (ci->hasCopyExpr() || BlockRequiresCopying(type));
1281     note.cxxbar_import = ci->getCopyExpr();
1282 
1283     if (ci->isByRef()) {
1284       note.flag = BLOCK_FIELD_IS_BYREF;
1285       if (type.isObjCGCWeak())
1286         note.flag |= BLOCK_FIELD_IS_WEAK;
1287     } else if (type->isBlockPointerType()) {
1288       note.flag = BLOCK_FIELD_IS_BLOCK;
1289     } else {
1290       note.flag = BLOCK_FIELD_IS_OBJECT;
1291     }
1292  */
1293 
1294 
1295 /// Generate the copy-helper function for a block closure object:
1296 ///   static void block_copy_helper(block_t *dst, block_t *src);
1297 /// The runtime will have previously initialized 'dst' by doing a
1298 /// bit-copy of 'src'.
1299 ///
1300 /// Note that this copies an entire block closure object to the heap;
1301 /// it should not be confused with a 'byref copy helper', which moves
1302 /// the contents of an individual __block variable to the heap.
1303 llvm::Constant *
1304 CodeGenFunction::GenerateCopyHelperFunction(const CGBlockInfo &blockInfo) {
1305   ASTContext &C = getContext();
1306 
1307   FunctionArgList args;
1308   ImplicitParamDecl dstDecl(0, SourceLocation(), 0, C.VoidPtrTy);
1309   args.push_back(&dstDecl);
1310   ImplicitParamDecl srcDecl(0, SourceLocation(), 0, C.VoidPtrTy);
1311   args.push_back(&srcDecl);
1312 
1313   const CGFunctionInfo &FI =
1314     CGM.getTypes().arrangeFunctionDeclaration(C.VoidTy, args,
1315                                               FunctionType::ExtInfo(),
1316                                               /*variadic*/ false);
1317 
1318   // FIXME: it would be nice if these were mergeable with things with
1319   // identical semantics.
1320   llvm::FunctionType *LTy = CGM.getTypes().GetFunctionType(FI);
1321 
1322   llvm::Function *Fn =
1323     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
1324                            "__copy_helper_block_", &CGM.getModule());
1325 
1326   IdentifierInfo *II
1327     = &CGM.getContext().Idents.get("__copy_helper_block_");
1328 
1329   // Check if we should generate debug info for this block helper function.
1330   maybeInitializeDebugInfo();
1331 
1332   FunctionDecl *FD = FunctionDecl::Create(C,
1333                                           C.getTranslationUnitDecl(),
1334                                           SourceLocation(),
1335                                           SourceLocation(), II, C.VoidTy, 0,
1336                                           SC_Static,
1337                                           false,
1338                                           false);
1339   StartFunction(FD, C.VoidTy, Fn, FI, args, SourceLocation());
1340 
1341   llvm::Type *structPtrTy = blockInfo.StructureType->getPointerTo();
1342 
1343   llvm::Value *src = GetAddrOfLocalVar(&srcDecl);
1344   src = Builder.CreateLoad(src);
1345   src = Builder.CreateBitCast(src, structPtrTy, "block.source");
1346 
1347   llvm::Value *dst = GetAddrOfLocalVar(&dstDecl);
1348   dst = Builder.CreateLoad(dst);
1349   dst = Builder.CreateBitCast(dst, structPtrTy, "block.dest");
1350 
1351   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
1352 
1353   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
1354          ce = blockDecl->capture_end(); ci != ce; ++ci) {
1355     const VarDecl *variable = ci->getVariable();
1356     QualType type = variable->getType();
1357 
1358     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
1359     if (capture.isConstant()) continue;
1360 
1361     const Expr *copyExpr = ci->getCopyExpr();
1362     BlockFieldFlags flags;
1363 
1364     bool useARCWeakCopy = false;
1365     bool useARCStrongCopy = false;
1366 
1367     if (copyExpr) {
1368       assert(!ci->isByRef());
1369       // don't bother computing flags
1370 
1371     } else if (ci->isByRef()) {
1372       flags = BLOCK_FIELD_IS_BYREF;
1373       if (type.isObjCGCWeak())
1374         flags |= BLOCK_FIELD_IS_WEAK;
1375 
1376     } else if (type->isObjCRetainableType()) {
1377       flags = BLOCK_FIELD_IS_OBJECT;
1378       bool isBlockPointer = type->isBlockPointerType();
1379       if (isBlockPointer)
1380         flags = BLOCK_FIELD_IS_BLOCK;
1381 
1382       // Special rules for ARC captures:
1383       if (getLangOpts().ObjCAutoRefCount) {
1384         Qualifiers qs = type.getQualifiers();
1385 
1386         // We need to register __weak direct captures with the runtime.
1387         if (qs.getObjCLifetime() == Qualifiers::OCL_Weak) {
1388           useARCWeakCopy = true;
1389 
1390         // We need to retain the copied value for __strong direct captures.
1391         } else if (qs.getObjCLifetime() == Qualifiers::OCL_Strong) {
1392           // If it's a block pointer, we have to copy the block and
1393           // assign that to the destination pointer, so we might as
1394           // well use _Block_object_assign.  Otherwise we can avoid that.
1395           if (!isBlockPointer)
1396             useARCStrongCopy = true;
1397 
1398         // Otherwise the memcpy is fine.
1399         } else {
1400           continue;
1401         }
1402 
1403       // Non-ARC captures of retainable pointers are strong and
1404       // therefore require a call to _Block_object_assign.
1405       } else {
1406         // fall through
1407       }
1408     } else {
1409       continue;
1410     }
1411 
1412     unsigned index = capture.getIndex();
1413     llvm::Value *srcField = Builder.CreateStructGEP(src, index);
1414     llvm::Value *dstField = Builder.CreateStructGEP(dst, index);
1415 
1416     // If there's an explicit copy expression, we do that.
1417     if (copyExpr) {
1418       EmitSynthesizedCXXCopyCtor(dstField, srcField, copyExpr);
1419     } else if (useARCWeakCopy) {
1420       EmitARCCopyWeak(dstField, srcField);
1421     } else {
1422       llvm::Value *srcValue = Builder.CreateLoad(srcField, "blockcopy.src");
1423       if (useARCStrongCopy) {
1424         // At -O0, store null into the destination field (so that the
1425         // storeStrong doesn't over-release) and then call storeStrong.
1426         // This is a workaround to not having an initStrong call.
1427         if (CGM.getCodeGenOpts().OptimizationLevel == 0) {
1428           llvm::PointerType *ty = cast<llvm::PointerType>(srcValue->getType());
1429           llvm::Value *null = llvm::ConstantPointerNull::get(ty);
1430           Builder.CreateStore(null, dstField);
1431           EmitARCStoreStrongCall(dstField, srcValue, true);
1432 
1433         // With optimization enabled, take advantage of the fact that
1434         // the blocks runtime guarantees a memcpy of the block data, and
1435         // just emit a retain of the src field.
1436         } else {
1437           EmitARCRetainNonBlock(srcValue);
1438 
1439           // We don't need this anymore, so kill it.  It's not quite
1440           // worth the annoyance to avoid creating it in the first place.
1441           cast<llvm::Instruction>(dstField)->eraseFromParent();
1442         }
1443       } else {
1444         srcValue = Builder.CreateBitCast(srcValue, VoidPtrTy);
1445         llvm::Value *dstAddr = Builder.CreateBitCast(dstField, VoidPtrTy);
1446         llvm::Value *args[] = {
1447           dstAddr, srcValue, llvm::ConstantInt::get(Int32Ty, flags.getBitMask())
1448         };
1449 
1450         bool copyCanThrow = false;
1451         if (ci->isByRef() && variable->getType()->getAsCXXRecordDecl()) {
1452           const Expr *copyExpr =
1453             CGM.getContext().getBlockVarCopyInits(variable);
1454           if (copyExpr) {
1455             copyCanThrow = true; // FIXME: reuse the noexcept logic
1456           }
1457         }
1458 
1459         if (copyCanThrow) {
1460           EmitRuntimeCallOrInvoke(CGM.getBlockObjectAssign(), args);
1461         } else {
1462           EmitNounwindRuntimeCall(CGM.getBlockObjectAssign(), args);
1463         }
1464       }
1465     }
1466   }
1467 
1468   FinishFunction();
1469 
1470   return llvm::ConstantExpr::getBitCast(Fn, VoidPtrTy);
1471 }
1472 
1473 /// Generate the destroy-helper function for a block closure object:
1474 ///   static void block_destroy_helper(block_t *theBlock);
1475 ///
1476 /// Note that this destroys a heap-allocated block closure object;
1477 /// it should not be confused with a 'byref destroy helper', which
1478 /// destroys the heap-allocated contents of an individual __block
1479 /// variable.
1480 llvm::Constant *
1481 CodeGenFunction::GenerateDestroyHelperFunction(const CGBlockInfo &blockInfo) {
1482   ASTContext &C = getContext();
1483 
1484   FunctionArgList args;
1485   ImplicitParamDecl srcDecl(0, SourceLocation(), 0, C.VoidPtrTy);
1486   args.push_back(&srcDecl);
1487 
1488   const CGFunctionInfo &FI =
1489     CGM.getTypes().arrangeFunctionDeclaration(C.VoidTy, args,
1490                                               FunctionType::ExtInfo(),
1491                                               /*variadic*/ false);
1492 
1493   // FIXME: We'd like to put these into a mergable by content, with
1494   // internal linkage.
1495   llvm::FunctionType *LTy = CGM.getTypes().GetFunctionType(FI);
1496 
1497   llvm::Function *Fn =
1498     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
1499                            "__destroy_helper_block_", &CGM.getModule());
1500 
1501   // Check if we should generate debug info for this block destroy function.
1502   maybeInitializeDebugInfo();
1503 
1504   IdentifierInfo *II
1505     = &CGM.getContext().Idents.get("__destroy_helper_block_");
1506 
1507   FunctionDecl *FD = FunctionDecl::Create(C, C.getTranslationUnitDecl(),
1508                                           SourceLocation(),
1509                                           SourceLocation(), II, C.VoidTy, 0,
1510                                           SC_Static,
1511                                           false, false);
1512   StartFunction(FD, C.VoidTy, Fn, FI, args, SourceLocation());
1513 
1514   llvm::Type *structPtrTy = blockInfo.StructureType->getPointerTo();
1515 
1516   llvm::Value *src = GetAddrOfLocalVar(&srcDecl);
1517   src = Builder.CreateLoad(src);
1518   src = Builder.CreateBitCast(src, structPtrTy, "block");
1519 
1520   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
1521 
1522   CodeGenFunction::RunCleanupsScope cleanups(*this);
1523 
1524   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
1525          ce = blockDecl->capture_end(); ci != ce; ++ci) {
1526     const VarDecl *variable = ci->getVariable();
1527     QualType type = variable->getType();
1528 
1529     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
1530     if (capture.isConstant()) continue;
1531 
1532     BlockFieldFlags flags;
1533     const CXXDestructorDecl *dtor = 0;
1534 
1535     bool useARCWeakDestroy = false;
1536     bool useARCStrongDestroy = false;
1537 
1538     if (ci->isByRef()) {
1539       flags = BLOCK_FIELD_IS_BYREF;
1540       if (type.isObjCGCWeak())
1541         flags |= BLOCK_FIELD_IS_WEAK;
1542     } else if (const CXXRecordDecl *record = type->getAsCXXRecordDecl()) {
1543       if (record->hasTrivialDestructor())
1544         continue;
1545       dtor = record->getDestructor();
1546     } else if (type->isObjCRetainableType()) {
1547       flags = BLOCK_FIELD_IS_OBJECT;
1548       if (type->isBlockPointerType())
1549         flags = BLOCK_FIELD_IS_BLOCK;
1550 
1551       // Special rules for ARC captures.
1552       if (getLangOpts().ObjCAutoRefCount) {
1553         Qualifiers qs = type.getQualifiers();
1554 
1555         // Don't generate special dispose logic for a captured object
1556         // unless it's __strong or __weak.
1557         if (!qs.hasStrongOrWeakObjCLifetime())
1558           continue;
1559 
1560         // Support __weak direct captures.
1561         if (qs.getObjCLifetime() == Qualifiers::OCL_Weak)
1562           useARCWeakDestroy = true;
1563 
1564         // Tools really want us to use objc_storeStrong here.
1565         else
1566           useARCStrongDestroy = true;
1567       }
1568     } else {
1569       continue;
1570     }
1571 
1572     unsigned index = capture.getIndex();
1573     llvm::Value *srcField = Builder.CreateStructGEP(src, index);
1574 
1575     // If there's an explicit copy expression, we do that.
1576     if (dtor) {
1577       PushDestructorCleanup(dtor, srcField);
1578 
1579     // If this is a __weak capture, emit the release directly.
1580     } else if (useARCWeakDestroy) {
1581       EmitARCDestroyWeak(srcField);
1582 
1583     // Destroy strong objects with a call if requested.
1584     } else if (useARCStrongDestroy) {
1585       EmitARCDestroyStrong(srcField, ARCImpreciseLifetime);
1586 
1587     // Otherwise we call _Block_object_dispose.  It wouldn't be too
1588     // hard to just emit this as a cleanup if we wanted to make sure
1589     // that things were done in reverse.
1590     } else {
1591       llvm::Value *value = Builder.CreateLoad(srcField);
1592       value = Builder.CreateBitCast(value, VoidPtrTy);
1593       BuildBlockRelease(value, flags);
1594     }
1595   }
1596 
1597   cleanups.ForceCleanup();
1598 
1599   FinishFunction();
1600 
1601   return llvm::ConstantExpr::getBitCast(Fn, VoidPtrTy);
1602 }
1603 
1604 namespace {
1605 
1606 /// Emits the copy/dispose helper functions for a __block object of id type.
1607 class ObjectByrefHelpers : public CodeGenModule::ByrefHelpers {
1608   BlockFieldFlags Flags;
1609 
1610 public:
1611   ObjectByrefHelpers(CharUnits alignment, BlockFieldFlags flags)
1612     : ByrefHelpers(alignment), Flags(flags) {}
1613 
1614   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
1615                 llvm::Value *srcField) {
1616     destField = CGF.Builder.CreateBitCast(destField, CGF.VoidPtrTy);
1617 
1618     srcField = CGF.Builder.CreateBitCast(srcField, CGF.VoidPtrPtrTy);
1619     llvm::Value *srcValue = CGF.Builder.CreateLoad(srcField);
1620 
1621     unsigned flags = (Flags | BLOCK_BYREF_CALLER).getBitMask();
1622 
1623     llvm::Value *flagsVal = llvm::ConstantInt::get(CGF.Int32Ty, flags);
1624     llvm::Value *fn = CGF.CGM.getBlockObjectAssign();
1625 
1626     llvm::Value *args[] = { destField, srcValue, flagsVal };
1627     CGF.EmitNounwindRuntimeCall(fn, args);
1628   }
1629 
1630   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
1631     field = CGF.Builder.CreateBitCast(field, CGF.Int8PtrTy->getPointerTo(0));
1632     llvm::Value *value = CGF.Builder.CreateLoad(field);
1633 
1634     CGF.BuildBlockRelease(value, Flags | BLOCK_BYREF_CALLER);
1635   }
1636 
1637   void profileImpl(llvm::FoldingSetNodeID &id) const {
1638     id.AddInteger(Flags.getBitMask());
1639   }
1640 };
1641 
1642 /// Emits the copy/dispose helpers for an ARC __block __weak variable.
1643 class ARCWeakByrefHelpers : public CodeGenModule::ByrefHelpers {
1644 public:
1645   ARCWeakByrefHelpers(CharUnits alignment) : ByrefHelpers(alignment) {}
1646 
1647   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
1648                 llvm::Value *srcField) {
1649     CGF.EmitARCMoveWeak(destField, srcField);
1650   }
1651 
1652   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
1653     CGF.EmitARCDestroyWeak(field);
1654   }
1655 
1656   void profileImpl(llvm::FoldingSetNodeID &id) const {
1657     // 0 is distinguishable from all pointers and byref flags
1658     id.AddInteger(0);
1659   }
1660 };
1661 
1662 /// Emits the copy/dispose helpers for an ARC __block __strong variable
1663 /// that's not of block-pointer type.
1664 class ARCStrongByrefHelpers : public CodeGenModule::ByrefHelpers {
1665 public:
1666   ARCStrongByrefHelpers(CharUnits alignment) : ByrefHelpers(alignment) {}
1667 
1668   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
1669                 llvm::Value *srcField) {
1670     // Do a "move" by copying the value and then zeroing out the old
1671     // variable.
1672 
1673     llvm::LoadInst *value = CGF.Builder.CreateLoad(srcField);
1674     value->setAlignment(Alignment.getQuantity());
1675 
1676     llvm::Value *null =
1677       llvm::ConstantPointerNull::get(cast<llvm::PointerType>(value->getType()));
1678 
1679     if (CGF.CGM.getCodeGenOpts().OptimizationLevel == 0) {
1680       llvm::StoreInst *store = CGF.Builder.CreateStore(null, destField);
1681       store->setAlignment(Alignment.getQuantity());
1682       CGF.EmitARCStoreStrongCall(destField, value, /*ignored*/ true);
1683       CGF.EmitARCStoreStrongCall(srcField, null, /*ignored*/ true);
1684       return;
1685     }
1686     llvm::StoreInst *store = CGF.Builder.CreateStore(value, destField);
1687     store->setAlignment(Alignment.getQuantity());
1688 
1689     store = CGF.Builder.CreateStore(null, srcField);
1690     store->setAlignment(Alignment.getQuantity());
1691   }
1692 
1693   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
1694     CGF.EmitARCDestroyStrong(field, ARCImpreciseLifetime);
1695   }
1696 
1697   void profileImpl(llvm::FoldingSetNodeID &id) const {
1698     // 1 is distinguishable from all pointers and byref flags
1699     id.AddInteger(1);
1700   }
1701 };
1702 
1703 /// Emits the copy/dispose helpers for an ARC __block __strong
1704 /// variable that's of block-pointer type.
1705 class ARCStrongBlockByrefHelpers : public CodeGenModule::ByrefHelpers {
1706 public:
1707   ARCStrongBlockByrefHelpers(CharUnits alignment) : ByrefHelpers(alignment) {}
1708 
1709   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
1710                 llvm::Value *srcField) {
1711     // Do the copy with objc_retainBlock; that's all that
1712     // _Block_object_assign would do anyway, and we'd have to pass the
1713     // right arguments to make sure it doesn't get no-op'ed.
1714     llvm::LoadInst *oldValue = CGF.Builder.CreateLoad(srcField);
1715     oldValue->setAlignment(Alignment.getQuantity());
1716 
1717     llvm::Value *copy = CGF.EmitARCRetainBlock(oldValue, /*mandatory*/ true);
1718 
1719     llvm::StoreInst *store = CGF.Builder.CreateStore(copy, destField);
1720     store->setAlignment(Alignment.getQuantity());
1721   }
1722 
1723   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
1724     CGF.EmitARCDestroyStrong(field, ARCImpreciseLifetime);
1725   }
1726 
1727   void profileImpl(llvm::FoldingSetNodeID &id) const {
1728     // 2 is distinguishable from all pointers and byref flags
1729     id.AddInteger(2);
1730   }
1731 };
1732 
1733 /// Emits the copy/dispose helpers for a __block variable with a
1734 /// nontrivial copy constructor or destructor.
1735 class CXXByrefHelpers : public CodeGenModule::ByrefHelpers {
1736   QualType VarType;
1737   const Expr *CopyExpr;
1738 
1739 public:
1740   CXXByrefHelpers(CharUnits alignment, QualType type,
1741                   const Expr *copyExpr)
1742     : ByrefHelpers(alignment), VarType(type), CopyExpr(copyExpr) {}
1743 
1744   bool needsCopy() const { return CopyExpr != 0; }
1745   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
1746                 llvm::Value *srcField) {
1747     if (!CopyExpr) return;
1748     CGF.EmitSynthesizedCXXCopyCtor(destField, srcField, CopyExpr);
1749   }
1750 
1751   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
1752     EHScopeStack::stable_iterator cleanupDepth = CGF.EHStack.stable_begin();
1753     CGF.PushDestructorCleanup(VarType, field);
1754     CGF.PopCleanupBlocks(cleanupDepth);
1755   }
1756 
1757   void profileImpl(llvm::FoldingSetNodeID &id) const {
1758     id.AddPointer(VarType.getCanonicalType().getAsOpaquePtr());
1759   }
1760 };
1761 } // end anonymous namespace
1762 
1763 static llvm::Constant *
1764 generateByrefCopyHelper(CodeGenFunction &CGF,
1765                         llvm::StructType &byrefType,
1766                         unsigned valueFieldIndex,
1767                         CodeGenModule::ByrefHelpers &byrefInfo) {
1768   ASTContext &Context = CGF.getContext();
1769 
1770   QualType R = Context.VoidTy;
1771 
1772   FunctionArgList args;
1773   ImplicitParamDecl dst(0, SourceLocation(), 0, Context.VoidPtrTy);
1774   args.push_back(&dst);
1775 
1776   ImplicitParamDecl src(0, SourceLocation(), 0, Context.VoidPtrTy);
1777   args.push_back(&src);
1778 
1779   const CGFunctionInfo &FI =
1780     CGF.CGM.getTypes().arrangeFunctionDeclaration(R, args,
1781                                                   FunctionType::ExtInfo(),
1782                                                   /*variadic*/ false);
1783 
1784   CodeGenTypes &Types = CGF.CGM.getTypes();
1785   llvm::FunctionType *LTy = Types.GetFunctionType(FI);
1786 
1787   // FIXME: We'd like to put these into a mergable by content, with
1788   // internal linkage.
1789   llvm::Function *Fn =
1790     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
1791                            "__Block_byref_object_copy_", &CGF.CGM.getModule());
1792 
1793   IdentifierInfo *II
1794     = &Context.Idents.get("__Block_byref_object_copy_");
1795 
1796   FunctionDecl *FD = FunctionDecl::Create(Context,
1797                                           Context.getTranslationUnitDecl(),
1798                                           SourceLocation(),
1799                                           SourceLocation(), II, R, 0,
1800                                           SC_Static,
1801                                           false, false);
1802 
1803   // Initialize debug info if necessary.
1804   CGF.maybeInitializeDebugInfo();
1805   CGF.StartFunction(FD, R, Fn, FI, args, SourceLocation());
1806 
1807   if (byrefInfo.needsCopy()) {
1808     llvm::Type *byrefPtrType = byrefType.getPointerTo(0);
1809 
1810     // dst->x
1811     llvm::Value *destField = CGF.GetAddrOfLocalVar(&dst);
1812     destField = CGF.Builder.CreateLoad(destField);
1813     destField = CGF.Builder.CreateBitCast(destField, byrefPtrType);
1814     destField = CGF.Builder.CreateStructGEP(destField, valueFieldIndex, "x");
1815 
1816     // src->x
1817     llvm::Value *srcField = CGF.GetAddrOfLocalVar(&src);
1818     srcField = CGF.Builder.CreateLoad(srcField);
1819     srcField = CGF.Builder.CreateBitCast(srcField, byrefPtrType);
1820     srcField = CGF.Builder.CreateStructGEP(srcField, valueFieldIndex, "x");
1821 
1822     byrefInfo.emitCopy(CGF, destField, srcField);
1823   }
1824 
1825   CGF.FinishFunction();
1826 
1827   return llvm::ConstantExpr::getBitCast(Fn, CGF.Int8PtrTy);
1828 }
1829 
1830 /// Build the copy helper for a __block variable.
1831 static llvm::Constant *buildByrefCopyHelper(CodeGenModule &CGM,
1832                                             llvm::StructType &byrefType,
1833                                             unsigned byrefValueIndex,
1834                                             CodeGenModule::ByrefHelpers &info) {
1835   CodeGenFunction CGF(CGM);
1836   return generateByrefCopyHelper(CGF, byrefType, byrefValueIndex, info);
1837 }
1838 
1839 /// Generate code for a __block variable's dispose helper.
1840 static llvm::Constant *
1841 generateByrefDisposeHelper(CodeGenFunction &CGF,
1842                            llvm::StructType &byrefType,
1843                            unsigned byrefValueIndex,
1844                            CodeGenModule::ByrefHelpers &byrefInfo) {
1845   ASTContext &Context = CGF.getContext();
1846   QualType R = Context.VoidTy;
1847 
1848   FunctionArgList args;
1849   ImplicitParamDecl src(0, SourceLocation(), 0, Context.VoidPtrTy);
1850   args.push_back(&src);
1851 
1852   const CGFunctionInfo &FI =
1853     CGF.CGM.getTypes().arrangeFunctionDeclaration(R, args,
1854                                                   FunctionType::ExtInfo(),
1855                                                   /*variadic*/ false);
1856 
1857   CodeGenTypes &Types = CGF.CGM.getTypes();
1858   llvm::FunctionType *LTy = Types.GetFunctionType(FI);
1859 
1860   // FIXME: We'd like to put these into a mergable by content, with
1861   // internal linkage.
1862   llvm::Function *Fn =
1863     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
1864                            "__Block_byref_object_dispose_",
1865                            &CGF.CGM.getModule());
1866 
1867   IdentifierInfo *II
1868     = &Context.Idents.get("__Block_byref_object_dispose_");
1869 
1870   FunctionDecl *FD = FunctionDecl::Create(Context,
1871                                           Context.getTranslationUnitDecl(),
1872                                           SourceLocation(),
1873                                           SourceLocation(), II, R, 0,
1874                                           SC_Static,
1875                                           false, false);
1876   // Initialize debug info if necessary.
1877   CGF.maybeInitializeDebugInfo();
1878   CGF.StartFunction(FD, R, Fn, FI, args, SourceLocation());
1879 
1880   if (byrefInfo.needsDispose()) {
1881     llvm::Value *V = CGF.GetAddrOfLocalVar(&src);
1882     V = CGF.Builder.CreateLoad(V);
1883     V = CGF.Builder.CreateBitCast(V, byrefType.getPointerTo(0));
1884     V = CGF.Builder.CreateStructGEP(V, byrefValueIndex, "x");
1885 
1886     byrefInfo.emitDispose(CGF, V);
1887   }
1888 
1889   CGF.FinishFunction();
1890 
1891   return llvm::ConstantExpr::getBitCast(Fn, CGF.Int8PtrTy);
1892 }
1893 
1894 /// Build the dispose helper for a __block variable.
1895 static llvm::Constant *buildByrefDisposeHelper(CodeGenModule &CGM,
1896                                               llvm::StructType &byrefType,
1897                                                unsigned byrefValueIndex,
1898                                             CodeGenModule::ByrefHelpers &info) {
1899   CodeGenFunction CGF(CGM);
1900   return generateByrefDisposeHelper(CGF, byrefType, byrefValueIndex, info);
1901 }
1902 
1903 /// Lazily build the copy and dispose helpers for a __block variable
1904 /// with the given information.
1905 template <class T> static T *buildByrefHelpers(CodeGenModule &CGM,
1906                                                llvm::StructType &byrefTy,
1907                                                unsigned byrefValueIndex,
1908                                                T &byrefInfo) {
1909   // Increase the field's alignment to be at least pointer alignment,
1910   // since the layout of the byref struct will guarantee at least that.
1911   byrefInfo.Alignment = std::max(byrefInfo.Alignment,
1912                               CharUnits::fromQuantity(CGM.PointerAlignInBytes));
1913 
1914   llvm::FoldingSetNodeID id;
1915   byrefInfo.Profile(id);
1916 
1917   void *insertPos;
1918   CodeGenModule::ByrefHelpers *node
1919     = CGM.ByrefHelpersCache.FindNodeOrInsertPos(id, insertPos);
1920   if (node) return static_cast<T*>(node);
1921 
1922   byrefInfo.CopyHelper =
1923     buildByrefCopyHelper(CGM, byrefTy, byrefValueIndex, byrefInfo);
1924   byrefInfo.DisposeHelper =
1925     buildByrefDisposeHelper(CGM, byrefTy, byrefValueIndex,byrefInfo);
1926 
1927   T *copy = new (CGM.getContext()) T(byrefInfo);
1928   CGM.ByrefHelpersCache.InsertNode(copy, insertPos);
1929   return copy;
1930 }
1931 
1932 /// Build the copy and dispose helpers for the given __block variable
1933 /// emission.  Places the helpers in the global cache.  Returns null
1934 /// if no helpers are required.
1935 CodeGenModule::ByrefHelpers *
1936 CodeGenFunction::buildByrefHelpers(llvm::StructType &byrefType,
1937                                    const AutoVarEmission &emission) {
1938   const VarDecl &var = *emission.Variable;
1939   QualType type = var.getType();
1940 
1941   unsigned byrefValueIndex = getByRefValueLLVMField(&var);
1942 
1943   if (const CXXRecordDecl *record = type->getAsCXXRecordDecl()) {
1944     const Expr *copyExpr = CGM.getContext().getBlockVarCopyInits(&var);
1945     if (!copyExpr && record->hasTrivialDestructor()) return 0;
1946 
1947     CXXByrefHelpers byrefInfo(emission.Alignment, type, copyExpr);
1948     return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
1949   }
1950 
1951   // Otherwise, if we don't have a retainable type, there's nothing to do.
1952   // that the runtime does extra copies.
1953   if (!type->isObjCRetainableType()) return 0;
1954 
1955   Qualifiers qs = type.getQualifiers();
1956 
1957   // If we have lifetime, that dominates.
1958   if (Qualifiers::ObjCLifetime lifetime = qs.getObjCLifetime()) {
1959     assert(getLangOpts().ObjCAutoRefCount);
1960 
1961     switch (lifetime) {
1962     case Qualifiers::OCL_None: llvm_unreachable("impossible");
1963 
1964     // These are just bits as far as the runtime is concerned.
1965     case Qualifiers::OCL_ExplicitNone:
1966     case Qualifiers::OCL_Autoreleasing:
1967       return 0;
1968 
1969     // Tell the runtime that this is ARC __weak, called by the
1970     // byref routines.
1971     case Qualifiers::OCL_Weak: {
1972       ARCWeakByrefHelpers byrefInfo(emission.Alignment);
1973       return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
1974     }
1975 
1976     // ARC __strong __block variables need to be retained.
1977     case Qualifiers::OCL_Strong:
1978       // Block pointers need to be copied, and there's no direct
1979       // transfer possible.
1980       if (type->isBlockPointerType()) {
1981         ARCStrongBlockByrefHelpers byrefInfo(emission.Alignment);
1982         return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
1983 
1984       // Otherwise, we transfer ownership of the retain from the stack
1985       // to the heap.
1986       } else {
1987         ARCStrongByrefHelpers byrefInfo(emission.Alignment);
1988         return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
1989       }
1990     }
1991     llvm_unreachable("fell out of lifetime switch!");
1992   }
1993 
1994   BlockFieldFlags flags;
1995   if (type->isBlockPointerType()) {
1996     flags |= BLOCK_FIELD_IS_BLOCK;
1997   } else if (CGM.getContext().isObjCNSObjectType(type) ||
1998              type->isObjCObjectPointerType()) {
1999     flags |= BLOCK_FIELD_IS_OBJECT;
2000   } else {
2001     return 0;
2002   }
2003 
2004   if (type.isObjCGCWeak())
2005     flags |= BLOCK_FIELD_IS_WEAK;
2006 
2007   ObjectByrefHelpers byrefInfo(emission.Alignment, flags);
2008   return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
2009 }
2010 
2011 unsigned CodeGenFunction::getByRefValueLLVMField(const ValueDecl *VD) const {
2012   assert(ByRefValueInfo.count(VD) && "Did not find value!");
2013 
2014   return ByRefValueInfo.find(VD)->second.second;
2015 }
2016 
2017 llvm::Value *CodeGenFunction::BuildBlockByrefAddress(llvm::Value *BaseAddr,
2018                                                      const VarDecl *V) {
2019   llvm::Value *Loc = Builder.CreateStructGEP(BaseAddr, 1, "forwarding");
2020   Loc = Builder.CreateLoad(Loc);
2021   Loc = Builder.CreateStructGEP(Loc, getByRefValueLLVMField(V),
2022                                 V->getNameAsString());
2023   return Loc;
2024 }
2025 
2026 /// BuildByRefType - This routine changes a __block variable declared as T x
2027 ///   into:
2028 ///
2029 ///      struct {
2030 ///        void *__isa;
2031 ///        void *__forwarding;
2032 ///        int32_t __flags;
2033 ///        int32_t __size;
2034 ///        void *__copy_helper;       // only if needed
2035 ///        void *__destroy_helper;    // only if needed
2036 ///        void *__byref_variable_layout;// only if needed
2037 ///        char padding[X];           // only if needed
2038 ///        T x;
2039 ///      } x
2040 ///
2041 llvm::Type *CodeGenFunction::BuildByRefType(const VarDecl *D) {
2042   std::pair<llvm::Type *, unsigned> &Info = ByRefValueInfo[D];
2043   if (Info.first)
2044     return Info.first;
2045 
2046   QualType Ty = D->getType();
2047 
2048   SmallVector<llvm::Type *, 8> types;
2049 
2050   llvm::StructType *ByRefType =
2051     llvm::StructType::create(getLLVMContext(),
2052                              "struct.__block_byref_" + D->getNameAsString());
2053 
2054   // void *__isa;
2055   types.push_back(Int8PtrTy);
2056 
2057   // void *__forwarding;
2058   types.push_back(llvm::PointerType::getUnqual(ByRefType));
2059 
2060   // int32_t __flags;
2061   types.push_back(Int32Ty);
2062 
2063   // int32_t __size;
2064   types.push_back(Int32Ty);
2065   // Note that this must match *exactly* the logic in buildByrefHelpers.
2066   bool HasCopyAndDispose = getContext().BlockRequiresCopying(Ty, D);
2067   if (HasCopyAndDispose) {
2068     /// void *__copy_helper;
2069     types.push_back(Int8PtrTy);
2070 
2071     /// void *__destroy_helper;
2072     types.push_back(Int8PtrTy);
2073   }
2074   bool HasByrefExtendedLayout = false;
2075   Qualifiers::ObjCLifetime Lifetime;
2076   if (getContext().getByrefLifetime(Ty, Lifetime, HasByrefExtendedLayout) &&
2077       HasByrefExtendedLayout)
2078     /// void *__byref_variable_layout;
2079     types.push_back(Int8PtrTy);
2080 
2081   bool Packed = false;
2082   CharUnits Align = getContext().getDeclAlign(D);
2083   if (Align >
2084       getContext().toCharUnitsFromBits(getTarget().getPointerAlign(0))) {
2085     // We have to insert padding.
2086 
2087     // The struct above has 2 32-bit integers.
2088     unsigned CurrentOffsetInBytes = 4 * 2;
2089 
2090     // And either 2, 3, 4 or 5 pointers.
2091     unsigned noPointers = 2;
2092     if (HasCopyAndDispose)
2093       noPointers += 2;
2094     if (HasByrefExtendedLayout)
2095       noPointers += 1;
2096 
2097     CurrentOffsetInBytes += noPointers * CGM.getDataLayout().getTypeAllocSize(Int8PtrTy);
2098 
2099     // Align the offset.
2100     unsigned AlignedOffsetInBytes =
2101       llvm::RoundUpToAlignment(CurrentOffsetInBytes, Align.getQuantity());
2102 
2103     unsigned NumPaddingBytes = AlignedOffsetInBytes - CurrentOffsetInBytes;
2104     if (NumPaddingBytes > 0) {
2105       llvm::Type *Ty = Int8Ty;
2106       // FIXME: We need a sema error for alignment larger than the minimum of
2107       // the maximal stack alignment and the alignment of malloc on the system.
2108       if (NumPaddingBytes > 1)
2109         Ty = llvm::ArrayType::get(Ty, NumPaddingBytes);
2110 
2111       types.push_back(Ty);
2112 
2113       // We want a packed struct.
2114       Packed = true;
2115     }
2116   }
2117 
2118   // T x;
2119   types.push_back(ConvertTypeForMem(Ty));
2120 
2121   ByRefType->setBody(types, Packed);
2122 
2123   Info.first = ByRefType;
2124 
2125   Info.second = types.size() - 1;
2126 
2127   return Info.first;
2128 }
2129 
2130 /// Initialize the structural components of a __block variable, i.e.
2131 /// everything but the actual object.
2132 void CodeGenFunction::emitByrefStructureInit(const AutoVarEmission &emission) {
2133   // Find the address of the local.
2134   llvm::Value *addr = emission.Address;
2135 
2136   // That's an alloca of the byref structure type.
2137   llvm::StructType *byrefType = cast<llvm::StructType>(
2138                  cast<llvm::PointerType>(addr->getType())->getElementType());
2139 
2140   // Build the byref helpers if necessary.  This is null if we don't need any.
2141   CodeGenModule::ByrefHelpers *helpers =
2142     buildByrefHelpers(*byrefType, emission);
2143 
2144   const VarDecl &D = *emission.Variable;
2145   QualType type = D.getType();
2146 
2147   bool HasByrefExtendedLayout;
2148   Qualifiers::ObjCLifetime ByrefLifetime;
2149   bool ByRefHasLifetime =
2150     getContext().getByrefLifetime(type, ByrefLifetime, HasByrefExtendedLayout);
2151 
2152   llvm::Value *V;
2153 
2154   // Initialize the 'isa', which is just 0 or 1.
2155   int isa = 0;
2156   if (type.isObjCGCWeak())
2157     isa = 1;
2158   V = Builder.CreateIntToPtr(Builder.getInt32(isa), Int8PtrTy, "isa");
2159   Builder.CreateStore(V, Builder.CreateStructGEP(addr, 0, "byref.isa"));
2160 
2161   // Store the address of the variable into its own forwarding pointer.
2162   Builder.CreateStore(addr,
2163                       Builder.CreateStructGEP(addr, 1, "byref.forwarding"));
2164 
2165   // Blocks ABI:
2166   //   c) the flags field is set to either 0 if no helper functions are
2167   //      needed or BLOCK_BYREF_HAS_COPY_DISPOSE if they are,
2168   BlockFlags flags;
2169   if (helpers) flags |= BLOCK_BYREF_HAS_COPY_DISPOSE;
2170   if (ByRefHasLifetime) {
2171     if (HasByrefExtendedLayout) flags |= BLOCK_BYREF_LAYOUT_EXTENDED;
2172       else switch (ByrefLifetime) {
2173         case Qualifiers::OCL_Strong:
2174           flags |= BLOCK_BYREF_LAYOUT_STRONG;
2175           break;
2176         case Qualifiers::OCL_Weak:
2177           flags |= BLOCK_BYREF_LAYOUT_WEAK;
2178           break;
2179         case Qualifiers::OCL_ExplicitNone:
2180           flags |= BLOCK_BYREF_LAYOUT_UNRETAINED;
2181           break;
2182         case Qualifiers::OCL_None:
2183           if (!type->isObjCObjectPointerType() && !type->isBlockPointerType())
2184             flags |= BLOCK_BYREF_LAYOUT_NON_OBJECT;
2185           break;
2186         default:
2187           break;
2188       }
2189     if (CGM.getLangOpts().ObjCGCBitmapPrint) {
2190       printf("\n Inline flag for BYREF variable layout (%d):", flags.getBitMask());
2191       if (flags & BLOCK_BYREF_HAS_COPY_DISPOSE)
2192         printf(" BLOCK_BYREF_HAS_COPY_DISPOSE");
2193       if (flags & BLOCK_BYREF_LAYOUT_MASK) {
2194         BlockFlags ThisFlag(flags.getBitMask() & BLOCK_BYREF_LAYOUT_MASK);
2195         if (ThisFlag ==  BLOCK_BYREF_LAYOUT_EXTENDED)
2196           printf(" BLOCK_BYREF_LAYOUT_EXTENDED");
2197         if (ThisFlag ==  BLOCK_BYREF_LAYOUT_STRONG)
2198           printf(" BLOCK_BYREF_LAYOUT_STRONG");
2199         if (ThisFlag == BLOCK_BYREF_LAYOUT_WEAK)
2200           printf(" BLOCK_BYREF_LAYOUT_WEAK");
2201         if (ThisFlag == BLOCK_BYREF_LAYOUT_UNRETAINED)
2202           printf(" BLOCK_BYREF_LAYOUT_UNRETAINED");
2203         if (ThisFlag == BLOCK_BYREF_LAYOUT_NON_OBJECT)
2204           printf(" BLOCK_BYREF_LAYOUT_NON_OBJECT");
2205       }
2206       printf("\n");
2207     }
2208   }
2209 
2210   Builder.CreateStore(llvm::ConstantInt::get(IntTy, flags.getBitMask()),
2211                       Builder.CreateStructGEP(addr, 2, "byref.flags"));
2212 
2213   CharUnits byrefSize = CGM.GetTargetTypeStoreSize(byrefType);
2214   V = llvm::ConstantInt::get(IntTy, byrefSize.getQuantity());
2215   Builder.CreateStore(V, Builder.CreateStructGEP(addr, 3, "byref.size"));
2216 
2217   if (helpers) {
2218     llvm::Value *copy_helper = Builder.CreateStructGEP(addr, 4);
2219     Builder.CreateStore(helpers->CopyHelper, copy_helper);
2220 
2221     llvm::Value *destroy_helper = Builder.CreateStructGEP(addr, 5);
2222     Builder.CreateStore(helpers->DisposeHelper, destroy_helper);
2223   }
2224   if (ByRefHasLifetime && HasByrefExtendedLayout) {
2225     llvm::Constant* ByrefLayoutInfo = CGM.getObjCRuntime().BuildByrefLayout(CGM, type);
2226     llvm::Value *ByrefInfoAddr = Builder.CreateStructGEP(addr, helpers ? 6 : 4,
2227                                                          "byref.layout");
2228     // cast destination to pointer to source type.
2229     llvm::Type *DesTy = ByrefLayoutInfo->getType();
2230     DesTy = DesTy->getPointerTo();
2231     llvm::Value *BC = Builder.CreatePointerCast(ByrefInfoAddr, DesTy);
2232     Builder.CreateStore(ByrefLayoutInfo, BC);
2233   }
2234 }
2235 
2236 void CodeGenFunction::BuildBlockRelease(llvm::Value *V, BlockFieldFlags flags) {
2237   llvm::Value *F = CGM.getBlockObjectDispose();
2238   llvm::Value *args[] = {
2239     Builder.CreateBitCast(V, Int8PtrTy),
2240     llvm::ConstantInt::get(Int32Ty, flags.getBitMask())
2241   };
2242   EmitNounwindRuntimeCall(F, args); // FIXME: throwing destructors?
2243 }
2244 
2245 namespace {
2246   struct CallBlockRelease : EHScopeStack::Cleanup {
2247     llvm::Value *Addr;
2248     CallBlockRelease(llvm::Value *Addr) : Addr(Addr) {}
2249 
2250     void Emit(CodeGenFunction &CGF, Flags flags) {
2251       // Should we be passing FIELD_IS_WEAK here?
2252       CGF.BuildBlockRelease(Addr, BLOCK_FIELD_IS_BYREF);
2253     }
2254   };
2255 }
2256 
2257 /// Enter a cleanup to destroy a __block variable.  Note that this
2258 /// cleanup should be a no-op if the variable hasn't left the stack
2259 /// yet; if a cleanup is required for the variable itself, that needs
2260 /// to be done externally.
2261 void CodeGenFunction::enterByrefCleanup(const AutoVarEmission &emission) {
2262   // We don't enter this cleanup if we're in pure-GC mode.
2263   if (CGM.getLangOpts().getGC() == LangOptions::GCOnly)
2264     return;
2265 
2266   EHStack.pushCleanup<CallBlockRelease>(NormalAndEHCleanup, emission.Address);
2267 }
2268 
2269 /// Adjust the declaration of something from the blocks API.
2270 static void configureBlocksRuntimeObject(CodeGenModule &CGM,
2271                                          llvm::Constant *C) {
2272   if (!CGM.getLangOpts().BlocksRuntimeOptional) return;
2273 
2274   llvm::GlobalValue *GV = cast<llvm::GlobalValue>(C->stripPointerCasts());
2275   if (GV->isDeclaration() &&
2276       GV->getLinkage() == llvm::GlobalValue::ExternalLinkage)
2277     GV->setLinkage(llvm::GlobalValue::ExternalWeakLinkage);
2278 }
2279 
2280 llvm::Constant *CodeGenModule::getBlockObjectDispose() {
2281   if (BlockObjectDispose)
2282     return BlockObjectDispose;
2283 
2284   llvm::Type *args[] = { Int8PtrTy, Int32Ty };
2285   llvm::FunctionType *fty
2286     = llvm::FunctionType::get(VoidTy, args, false);
2287   BlockObjectDispose = CreateRuntimeFunction(fty, "_Block_object_dispose");
2288   configureBlocksRuntimeObject(*this, BlockObjectDispose);
2289   return BlockObjectDispose;
2290 }
2291 
2292 llvm::Constant *CodeGenModule::getBlockObjectAssign() {
2293   if (BlockObjectAssign)
2294     return BlockObjectAssign;
2295 
2296   llvm::Type *args[] = { Int8PtrTy, Int8PtrTy, Int32Ty };
2297   llvm::FunctionType *fty
2298     = llvm::FunctionType::get(VoidTy, args, false);
2299   BlockObjectAssign = CreateRuntimeFunction(fty, "_Block_object_assign");
2300   configureBlocksRuntimeObject(*this, BlockObjectAssign);
2301   return BlockObjectAssign;
2302 }
2303 
2304 llvm::Constant *CodeGenModule::getNSConcreteGlobalBlock() {
2305   if (NSConcreteGlobalBlock)
2306     return NSConcreteGlobalBlock;
2307 
2308   NSConcreteGlobalBlock = GetOrCreateLLVMGlobal("_NSConcreteGlobalBlock",
2309                                                 Int8PtrTy->getPointerTo(), 0);
2310   configureBlocksRuntimeObject(*this, NSConcreteGlobalBlock);
2311   return NSConcreteGlobalBlock;
2312 }
2313 
2314 llvm::Constant *CodeGenModule::getNSConcreteStackBlock() {
2315   if (NSConcreteStackBlock)
2316     return NSConcreteStackBlock;
2317 
2318   NSConcreteStackBlock = GetOrCreateLLVMGlobal("_NSConcreteStackBlock",
2319                                                Int8PtrTy->getPointerTo(), 0);
2320   configureBlocksRuntimeObject(*this, NSConcreteStackBlock);
2321   return NSConcreteStackBlock;
2322 }
2323