Home | History | Annotate | Download | only in CodeGen
      1 //===--- CGBlocks.cpp - Emit LLVM Code for declarations -------------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This contains code to emit blocks.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 #include "CGBlocks.h"
     15 #include "CGDebugInfo.h"
     16 #include "CGObjCRuntime.h"
     17 #include "CodeGenFunction.h"
     18 #include "CodeGenModule.h"
     19 #include "clang/AST/DeclObjC.h"
     20 #include "llvm/ADT/SmallSet.h"
     21 #include "llvm/IR/DataLayout.h"
     22 #include "llvm/IR/Module.h"
     23 #include "llvm/Support/CallSite.h"
     24 #include <algorithm>
     25 #include <cstdio>
     26 
     27 using namespace clang;
     28 using namespace CodeGen;
     29 
     30 CGBlockInfo::CGBlockInfo(const BlockDecl *block, StringRef name)
     31   : Name(name), CXXThisIndex(0), CanBeGlobal(false), NeedsCopyDispose(false),
     32     HasCXXObject(false), UsesStret(false), HasCapturedVariableLayout(false),
     33     StructureType(0), Block(block),
     34     DominatingIP(0) {
     35 
     36   // Skip asm prefix, if any.  'name' is usually taken directly from
     37   // the mangled name of the enclosing function.
     38   if (!name.empty() && name[0] == '\01')
     39     name = name.substr(1);
     40 }
     41 
     42 // Anchor the vtable to this translation unit.
     43 CodeGenModule::ByrefHelpers::~ByrefHelpers() {}
     44 
     45 /// Build the given block as a global block.
     46 static llvm::Constant *buildGlobalBlock(CodeGenModule &CGM,
     47                                         const CGBlockInfo &blockInfo,
     48                                         llvm::Constant *blockFn);
     49 
     50 /// Build the helper function to copy a block.
     51 static llvm::Constant *buildCopyHelper(CodeGenModule &CGM,
     52                                        const CGBlockInfo &blockInfo) {
     53   return CodeGenFunction(CGM).GenerateCopyHelperFunction(blockInfo);
     54 }
     55 
     56 /// Build the helper function to dipose of a block.
     57 static llvm::Constant *buildDisposeHelper(CodeGenModule &CGM,
     58                                           const CGBlockInfo &blockInfo) {
     59   return CodeGenFunction(CGM).GenerateDestroyHelperFunction(blockInfo);
     60 }
     61 
     62 /// buildBlockDescriptor - Build the block descriptor meta-data for a block.
     63 /// buildBlockDescriptor is accessed from 5th field of the Block_literal
     64 /// meta-data and contains stationary information about the block literal.
     65 /// Its definition will have 4 (or optinally 6) words.
     66 /// \code
     67 /// struct Block_descriptor {
     68 ///   unsigned long reserved;
     69 ///   unsigned long size;  // size of Block_literal metadata in bytes.
     70 ///   void *copy_func_helper_decl;  // optional copy helper.
     71 ///   void *destroy_func_decl; // optioanl destructor helper.
     72 ///   void *block_method_encoding_address; // @encode for block literal signature.
     73 ///   void *block_layout_info; // encoding of captured block variables.
     74 /// };
     75 /// \endcode
     76 static llvm::Constant *buildBlockDescriptor(CodeGenModule &CGM,
     77                                             const CGBlockInfo &blockInfo) {
     78   ASTContext &C = CGM.getContext();
     79 
     80   llvm::Type *ulong = CGM.getTypes().ConvertType(C.UnsignedLongTy);
     81   llvm::Type *i8p = CGM.getTypes().ConvertType(C.VoidPtrTy);
     82 
     83   SmallVector<llvm::Constant*, 6> elements;
     84 
     85   // reserved
     86   elements.push_back(llvm::ConstantInt::get(ulong, 0));
     87 
     88   // Size
     89   // FIXME: What is the right way to say this doesn't fit?  We should give
     90   // a user diagnostic in that case.  Better fix would be to change the
     91   // API to size_t.
     92   elements.push_back(llvm::ConstantInt::get(ulong,
     93                                             blockInfo.BlockSize.getQuantity()));
     94 
     95   // Optional copy/dispose helpers.
     96   if (blockInfo.NeedsCopyDispose) {
     97     // copy_func_helper_decl
     98     elements.push_back(buildCopyHelper(CGM, blockInfo));
     99 
    100     // destroy_func_decl
    101     elements.push_back(buildDisposeHelper(CGM, blockInfo));
    102   }
    103 
    104   // Signature.  Mandatory ObjC-style method descriptor @encode sequence.
    105   std::string typeAtEncoding =
    106     CGM.getContext().getObjCEncodingForBlock(blockInfo.getBlockExpr());
    107   elements.push_back(llvm::ConstantExpr::getBitCast(
    108                           CGM.GetAddrOfConstantCString(typeAtEncoding), i8p));
    109 
    110   // GC layout.
    111   if (C.getLangOpts().ObjC1) {
    112     if (CGM.getLangOpts().getGC() != LangOptions::NonGC)
    113       elements.push_back(CGM.getObjCRuntime().BuildGCBlockLayout(CGM, blockInfo));
    114     else
    115       elements.push_back(CGM.getObjCRuntime().BuildRCBlockLayout(CGM, blockInfo));
    116   }
    117   else
    118     elements.push_back(llvm::Constant::getNullValue(i8p));
    119 
    120   llvm::Constant *init = llvm::ConstantStruct::getAnon(elements);
    121 
    122   llvm::GlobalVariable *global =
    123     new llvm::GlobalVariable(CGM.getModule(), init->getType(), true,
    124                              llvm::GlobalValue::InternalLinkage,
    125                              init, "__block_descriptor_tmp");
    126 
    127   return llvm::ConstantExpr::getBitCast(global, CGM.getBlockDescriptorType());
    128 }
    129 
    130 /*
    131   Purely notional variadic template describing the layout of a block.
    132 
    133   template <class _ResultType, class... _ParamTypes, class... _CaptureTypes>
    134   struct Block_literal {
    135     /// Initialized to one of:
    136     ///   extern void *_NSConcreteStackBlock[];
    137     ///   extern void *_NSConcreteGlobalBlock[];
    138     ///
    139     /// In theory, we could start one off malloc'ed by setting
    140     /// BLOCK_NEEDS_FREE, giving it a refcount of 1, and using
    141     /// this isa:
    142     ///   extern void *_NSConcreteMallocBlock[];
    143     struct objc_class *isa;
    144 
    145     /// These are the flags (with corresponding bit number) that the
    146     /// compiler is actually supposed to know about.
    147     ///  25. BLOCK_HAS_COPY_DISPOSE - indicates that the block
    148     ///   descriptor provides copy and dispose helper functions
    149     ///  26. BLOCK_HAS_CXX_OBJ - indicates that there's a captured
    150     ///   object with a nontrivial destructor or copy constructor
    151     ///  28. BLOCK_IS_GLOBAL - indicates that the block is allocated
    152     ///   as global memory
    153     ///  29. BLOCK_USE_STRET - indicates that the block function
    154     ///   uses stret, which objc_msgSend needs to know about
    155     ///  30. BLOCK_HAS_SIGNATURE - indicates that the block has an
    156     ///   @encoded signature string
    157     /// And we're not supposed to manipulate these:
    158     ///  24. BLOCK_NEEDS_FREE - indicates that the block has been moved
    159     ///   to malloc'ed memory
    160     ///  27. BLOCK_IS_GC - indicates that the block has been moved to
    161     ///   to GC-allocated memory
    162     /// Additionally, the bottom 16 bits are a reference count which
    163     /// should be zero on the stack.
    164     int flags;
    165 
    166     /// Reserved;  should be zero-initialized.
    167     int reserved;
    168 
    169     /// Function pointer generated from block literal.
    170     _ResultType (*invoke)(Block_literal *, _ParamTypes...);
    171 
    172     /// Block description metadata generated from block literal.
    173     struct Block_descriptor *block_descriptor;
    174 
    175     /// Captured values follow.
    176     _CapturesTypes captures...;
    177   };
    178  */
    179 
    180 /// The number of fields in a block header.
    181 const unsigned BlockHeaderSize = 5;
    182 
    183 namespace {
    184   /// A chunk of data that we actually have to capture in the block.
    185   struct BlockLayoutChunk {
    186     CharUnits Alignment;
    187     CharUnits Size;
    188     Qualifiers::ObjCLifetime Lifetime;
    189     const BlockDecl::Capture *Capture; // null for 'this'
    190     llvm::Type *Type;
    191 
    192     BlockLayoutChunk(CharUnits align, CharUnits size,
    193                      Qualifiers::ObjCLifetime lifetime,
    194                      const BlockDecl::Capture *capture,
    195                      llvm::Type *type)
    196       : Alignment(align), Size(size), Lifetime(lifetime),
    197         Capture(capture), Type(type) {}
    198 
    199     /// Tell the block info that this chunk has the given field index.
    200     void setIndex(CGBlockInfo &info, unsigned index) {
    201       if (!Capture)
    202         info.CXXThisIndex = index;
    203       else
    204         info.Captures[Capture->getVariable()]
    205           = CGBlockInfo::Capture::makeIndex(index);
    206     }
    207   };
    208 
    209   /// Order by 1) all __strong together 2) next, all byfref together 3) next,
    210   /// all __weak together. Preserve descending alignment in all situations.
    211   bool operator<(const BlockLayoutChunk &left, const BlockLayoutChunk &right) {
    212     CharUnits LeftValue, RightValue;
    213     bool LeftByref = left.Capture ? left.Capture->isByRef() : false;
    214     bool RightByref = right.Capture ? right.Capture->isByRef() : false;
    215 
    216     if (left.Lifetime == Qualifiers::OCL_Strong &&
    217         left.Alignment >= right.Alignment)
    218       LeftValue = CharUnits::fromQuantity(64);
    219     else if (LeftByref && left.Alignment >= right.Alignment)
    220       LeftValue = CharUnits::fromQuantity(32);
    221     else if (left.Lifetime == Qualifiers::OCL_Weak &&
    222              left.Alignment >= right.Alignment)
    223       LeftValue = CharUnits::fromQuantity(16);
    224     else
    225       LeftValue = left.Alignment;
    226     if (right.Lifetime == Qualifiers::OCL_Strong &&
    227         right.Alignment >= left.Alignment)
    228       RightValue = CharUnits::fromQuantity(64);
    229     else if (RightByref && right.Alignment >= left.Alignment)
    230       RightValue = CharUnits::fromQuantity(32);
    231     else if (right.Lifetime == Qualifiers::OCL_Weak &&
    232              right.Alignment >= left.Alignment)
    233       RightValue = CharUnits::fromQuantity(16);
    234     else
    235       RightValue = right.Alignment;
    236 
    237       return LeftValue > RightValue;
    238   }
    239 }
    240 
    241 /// Determines if the given type is safe for constant capture in C++.
    242 static bool isSafeForCXXConstantCapture(QualType type) {
    243   const RecordType *recordType =
    244     type->getBaseElementTypeUnsafe()->getAs<RecordType>();
    245 
    246   // Only records can be unsafe.
    247   if (!recordType) return true;
    248 
    249   const CXXRecordDecl *record = cast<CXXRecordDecl>(recordType->getDecl());
    250 
    251   // Maintain semantics for classes with non-trivial dtors or copy ctors.
    252   if (!record->hasTrivialDestructor()) return false;
    253   if (record->hasNonTrivialCopyConstructor()) return false;
    254 
    255   // Otherwise, we just have to make sure there aren't any mutable
    256   // fields that might have changed since initialization.
    257   return !record->hasMutableFields();
    258 }
    259 
    260 /// It is illegal to modify a const object after initialization.
    261 /// Therefore, if a const object has a constant initializer, we don't
    262 /// actually need to keep storage for it in the block; we'll just
    263 /// rematerialize it at the start of the block function.  This is
    264 /// acceptable because we make no promises about address stability of
    265 /// captured variables.
    266 static llvm::Constant *tryCaptureAsConstant(CodeGenModule &CGM,
    267                                             CodeGenFunction *CGF,
    268                                             const VarDecl *var) {
    269   QualType type = var->getType();
    270 
    271   // We can only do this if the variable is const.
    272   if (!type.isConstQualified()) return 0;
    273 
    274   // Furthermore, in C++ we have to worry about mutable fields:
    275   // C++ [dcl.type.cv]p4:
    276   //   Except that any class member declared mutable can be
    277   //   modified, any attempt to modify a const object during its
    278   //   lifetime results in undefined behavior.
    279   if (CGM.getLangOpts().CPlusPlus && !isSafeForCXXConstantCapture(type))
    280     return 0;
    281 
    282   // If the variable doesn't have any initializer (shouldn't this be
    283   // invalid?), it's not clear what we should do.  Maybe capture as
    284   // zero?
    285   const Expr *init = var->getInit();
    286   if (!init) return 0;
    287 
    288   return CGM.EmitConstantInit(*var, CGF);
    289 }
    290 
    291 /// Get the low bit of a nonzero character count.  This is the
    292 /// alignment of the nth byte if the 0th byte is universally aligned.
    293 static CharUnits getLowBit(CharUnits v) {
    294   return CharUnits::fromQuantity(v.getQuantity() & (~v.getQuantity() + 1));
    295 }
    296 
    297 static void initializeForBlockHeader(CodeGenModule &CGM, CGBlockInfo &info,
    298                              SmallVectorImpl<llvm::Type*> &elementTypes) {
    299   ASTContext &C = CGM.getContext();
    300 
    301   // The header is basically a 'struct { void *; int; int; void *; void *; }'.
    302   CharUnits ptrSize, ptrAlign, intSize, intAlign;
    303   llvm::tie(ptrSize, ptrAlign) = C.getTypeInfoInChars(C.VoidPtrTy);
    304   llvm::tie(intSize, intAlign) = C.getTypeInfoInChars(C.IntTy);
    305 
    306   // Are there crazy embedded platforms where this isn't true?
    307   assert(intSize <= ptrSize && "layout assumptions horribly violated");
    308 
    309   CharUnits headerSize = ptrSize;
    310   if (2 * intSize < ptrAlign) headerSize += ptrSize;
    311   else headerSize += 2 * intSize;
    312   headerSize += 2 * ptrSize;
    313 
    314   info.BlockAlign = ptrAlign;
    315   info.BlockSize = headerSize;
    316 
    317   assert(elementTypes.empty());
    318   llvm::Type *i8p = CGM.getTypes().ConvertType(C.VoidPtrTy);
    319   llvm::Type *intTy = CGM.getTypes().ConvertType(C.IntTy);
    320   elementTypes.push_back(i8p);
    321   elementTypes.push_back(intTy);
    322   elementTypes.push_back(intTy);
    323   elementTypes.push_back(i8p);
    324   elementTypes.push_back(CGM.getBlockDescriptorType());
    325 
    326   assert(elementTypes.size() == BlockHeaderSize);
    327 }
    328 
    329 /// Compute the layout of the given block.  Attempts to lay the block
    330 /// out with minimal space requirements.
    331 static void computeBlockInfo(CodeGenModule &CGM, CodeGenFunction *CGF,
    332                              CGBlockInfo &info) {
    333   ASTContext &C = CGM.getContext();
    334   const BlockDecl *block = info.getBlockDecl();
    335 
    336   SmallVector<llvm::Type*, 8> elementTypes;
    337   initializeForBlockHeader(CGM, info, elementTypes);
    338 
    339   if (!block->hasCaptures()) {
    340     info.StructureType =
    341       llvm::StructType::get(CGM.getLLVMContext(), elementTypes, true);
    342     info.CanBeGlobal = true;
    343     return;
    344   }
    345   else if (C.getLangOpts().ObjC1 &&
    346            CGM.getLangOpts().getGC() == LangOptions::NonGC)
    347     info.HasCapturedVariableLayout = true;
    348 
    349   // Collect the layout chunks.
    350   SmallVector<BlockLayoutChunk, 16> layout;
    351   layout.reserve(block->capturesCXXThis() +
    352                  (block->capture_end() - block->capture_begin()));
    353 
    354   CharUnits maxFieldAlign;
    355 
    356   // First, 'this'.
    357   if (block->capturesCXXThis()) {
    358     assert(CGF && CGF->CurFuncDecl && isa<CXXMethodDecl>(CGF->CurFuncDecl) &&
    359            "Can't capture 'this' outside a method");
    360     QualType thisType = cast<CXXMethodDecl>(CGF->CurFuncDecl)->getThisType(C);
    361 
    362     llvm::Type *llvmType = CGM.getTypes().ConvertType(thisType);
    363     std::pair<CharUnits,CharUnits> tinfo
    364       = CGM.getContext().getTypeInfoInChars(thisType);
    365     maxFieldAlign = std::max(maxFieldAlign, tinfo.second);
    366 
    367     layout.push_back(BlockLayoutChunk(tinfo.second, tinfo.first,
    368                                       Qualifiers::OCL_None,
    369                                       0, llvmType));
    370   }
    371 
    372   // Next, all the block captures.
    373   for (BlockDecl::capture_const_iterator ci = block->capture_begin(),
    374          ce = block->capture_end(); ci != ce; ++ci) {
    375     const VarDecl *variable = ci->getVariable();
    376 
    377     if (ci->isByRef()) {
    378       // We have to copy/dispose of the __block reference.
    379       info.NeedsCopyDispose = true;
    380 
    381       // Just use void* instead of a pointer to the byref type.
    382       QualType byRefPtrTy = C.VoidPtrTy;
    383 
    384       llvm::Type *llvmType = CGM.getTypes().ConvertType(byRefPtrTy);
    385       std::pair<CharUnits,CharUnits> tinfo
    386         = CGM.getContext().getTypeInfoInChars(byRefPtrTy);
    387       maxFieldAlign = std::max(maxFieldAlign, tinfo.second);
    388 
    389       layout.push_back(BlockLayoutChunk(tinfo.second, tinfo.first,
    390                                         Qualifiers::OCL_None,
    391                                         &*ci, llvmType));
    392       continue;
    393     }
    394 
    395     // Otherwise, build a layout chunk with the size and alignment of
    396     // the declaration.
    397     if (llvm::Constant *constant = tryCaptureAsConstant(CGM, CGF, variable)) {
    398       info.Captures[variable] = CGBlockInfo::Capture::makeConstant(constant);
    399       continue;
    400     }
    401 
    402     // If we have a lifetime qualifier, honor it for capture purposes.
    403     // That includes *not* copying it if it's __unsafe_unretained.
    404     Qualifiers::ObjCLifetime lifetime =
    405       variable->getType().getObjCLifetime();
    406     if (lifetime) {
    407       switch (lifetime) {
    408       case Qualifiers::OCL_None: llvm_unreachable("impossible");
    409       case Qualifiers::OCL_ExplicitNone:
    410       case Qualifiers::OCL_Autoreleasing:
    411         break;
    412 
    413       case Qualifiers::OCL_Strong:
    414       case Qualifiers::OCL_Weak:
    415         info.NeedsCopyDispose = true;
    416       }
    417 
    418     // Block pointers require copy/dispose.  So do Objective-C pointers.
    419     } else if (variable->getType()->isObjCRetainableType()) {
    420       info.NeedsCopyDispose = true;
    421       // used for mrr below.
    422       lifetime = Qualifiers::OCL_Strong;
    423 
    424     // So do types that require non-trivial copy construction.
    425     } else if (ci->hasCopyExpr()) {
    426       info.NeedsCopyDispose = true;
    427       info.HasCXXObject = true;
    428 
    429     // And so do types with destructors.
    430     } else if (CGM.getLangOpts().CPlusPlus) {
    431       if (const CXXRecordDecl *record =
    432             variable->getType()->getAsCXXRecordDecl()) {
    433         if (!record->hasTrivialDestructor()) {
    434           info.HasCXXObject = true;
    435           info.NeedsCopyDispose = true;
    436         }
    437       }
    438     }
    439 
    440     QualType VT = variable->getType();
    441     CharUnits size = C.getTypeSizeInChars(VT);
    442     CharUnits align = C.getDeclAlign(variable);
    443 
    444     maxFieldAlign = std::max(maxFieldAlign, align);
    445 
    446     llvm::Type *llvmType =
    447       CGM.getTypes().ConvertTypeForMem(VT);
    448 
    449     layout.push_back(BlockLayoutChunk(align, size, lifetime, &*ci, llvmType));
    450   }
    451 
    452   // If that was everything, we're done here.
    453   if (layout.empty()) {
    454     info.StructureType =
    455       llvm::StructType::get(CGM.getLLVMContext(), elementTypes, true);
    456     info.CanBeGlobal = true;
    457     return;
    458   }
    459 
    460   // Sort the layout by alignment.  We have to use a stable sort here
    461   // to get reproducible results.  There should probably be an
    462   // llvm::array_pod_stable_sort.
    463   std::stable_sort(layout.begin(), layout.end());
    464 
    465   // Needed for blocks layout info.
    466   info.BlockHeaderForcedGapOffset = info.BlockSize;
    467   info.BlockHeaderForcedGapSize = CharUnits::Zero();
    468 
    469   CharUnits &blockSize = info.BlockSize;
    470   info.BlockAlign = std::max(maxFieldAlign, info.BlockAlign);
    471 
    472   // Assuming that the first byte in the header is maximally aligned,
    473   // get the alignment of the first byte following the header.
    474   CharUnits endAlign = getLowBit(blockSize);
    475 
    476   // If the end of the header isn't satisfactorily aligned for the
    477   // maximum thing, look for things that are okay with the header-end
    478   // alignment, and keep appending them until we get something that's
    479   // aligned right.  This algorithm is only guaranteed optimal if
    480   // that condition is satisfied at some point; otherwise we can get
    481   // things like:
    482   //   header                 // next byte has alignment 4
    483   //   something_with_size_5; // next byte has alignment 1
    484   //   something_with_alignment_8;
    485   // which has 7 bytes of padding, as opposed to the naive solution
    486   // which might have less (?).
    487   if (endAlign < maxFieldAlign) {
    488     SmallVectorImpl<BlockLayoutChunk>::iterator
    489       li = layout.begin() + 1, le = layout.end();
    490 
    491     // Look for something that the header end is already
    492     // satisfactorily aligned for.
    493     for (; li != le && endAlign < li->Alignment; ++li)
    494       ;
    495 
    496     // If we found something that's naturally aligned for the end of
    497     // the header, keep adding things...
    498     if (li != le) {
    499       SmallVectorImpl<BlockLayoutChunk>::iterator first = li;
    500       for (; li != le; ++li) {
    501         assert(endAlign >= li->Alignment);
    502 
    503         li->setIndex(info, elementTypes.size());
    504         elementTypes.push_back(li->Type);
    505         blockSize += li->Size;
    506         endAlign = getLowBit(blockSize);
    507 
    508         // ...until we get to the alignment of the maximum field.
    509         if (endAlign >= maxFieldAlign) {
    510           if (li == first) {
    511             // No user field was appended. So, a gap was added.
    512             // Save total gap size for use in block layout bit map.
    513             info.BlockHeaderForcedGapSize = li->Size;
    514           }
    515           break;
    516         }
    517       }
    518       // Don't re-append everything we just appended.
    519       layout.erase(first, li);
    520     }
    521   }
    522 
    523   assert(endAlign == getLowBit(blockSize));
    524 
    525   // At this point, we just have to add padding if the end align still
    526   // isn't aligned right.
    527   if (endAlign < maxFieldAlign) {
    528     CharUnits newBlockSize = blockSize.RoundUpToAlignment(maxFieldAlign);
    529     CharUnits padding = newBlockSize - blockSize;
    530 
    531     elementTypes.push_back(llvm::ArrayType::get(CGM.Int8Ty,
    532                                                 padding.getQuantity()));
    533     blockSize = newBlockSize;
    534     endAlign = getLowBit(blockSize); // might be > maxFieldAlign
    535   }
    536 
    537   assert(endAlign >= maxFieldAlign);
    538   assert(endAlign == getLowBit(blockSize));
    539   // Slam everything else on now.  This works because they have
    540   // strictly decreasing alignment and we expect that size is always a
    541   // multiple of alignment.
    542   for (SmallVectorImpl<BlockLayoutChunk>::iterator
    543          li = layout.begin(), le = layout.end(); li != le; ++li) {
    544     assert(endAlign >= li->Alignment);
    545     li->setIndex(info, elementTypes.size());
    546     elementTypes.push_back(li->Type);
    547     blockSize += li->Size;
    548     endAlign = getLowBit(blockSize);
    549   }
    550 
    551   info.StructureType =
    552     llvm::StructType::get(CGM.getLLVMContext(), elementTypes, true);
    553 }
    554 
    555 /// Enter the scope of a block.  This should be run at the entrance to
    556 /// a full-expression so that the block's cleanups are pushed at the
    557 /// right place in the stack.
    558 static void enterBlockScope(CodeGenFunction &CGF, BlockDecl *block) {
    559   assert(CGF.HaveInsertPoint());
    560 
    561   // Allocate the block info and place it at the head of the list.
    562   CGBlockInfo &blockInfo =
    563     *new CGBlockInfo(block, CGF.CurFn->getName());
    564   blockInfo.NextBlockInfo = CGF.FirstBlockInfo;
    565   CGF.FirstBlockInfo = &blockInfo;
    566 
    567   // Compute information about the layout, etc., of this block,
    568   // pushing cleanups as necessary.
    569   computeBlockInfo(CGF.CGM, &CGF, blockInfo);
    570 
    571   // Nothing else to do if it can be global.
    572   if (blockInfo.CanBeGlobal) return;
    573 
    574   // Make the allocation for the block.
    575   blockInfo.Address =
    576     CGF.CreateTempAlloca(blockInfo.StructureType, "block");
    577   blockInfo.Address->setAlignment(blockInfo.BlockAlign.getQuantity());
    578 
    579   // If there are cleanups to emit, enter them (but inactive).
    580   if (!blockInfo.NeedsCopyDispose) return;
    581 
    582   // Walk through the captures (in order) and find the ones not
    583   // captured by constant.
    584   for (BlockDecl::capture_const_iterator ci = block->capture_begin(),
    585          ce = block->capture_end(); ci != ce; ++ci) {
    586     // Ignore __block captures; there's nothing special in the
    587     // on-stack block that we need to do for them.
    588     if (ci->isByRef()) continue;
    589 
    590     // Ignore variables that are constant-captured.
    591     const VarDecl *variable = ci->getVariable();
    592     CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
    593     if (capture.isConstant()) continue;
    594 
    595     // Ignore objects that aren't destructed.
    596     QualType::DestructionKind dtorKind =
    597       variable->getType().isDestructedType();
    598     if (dtorKind == QualType::DK_none) continue;
    599 
    600     CodeGenFunction::Destroyer *destroyer;
    601 
    602     // Block captures count as local values and have imprecise semantics.
    603     // They also can't be arrays, so need to worry about that.
    604     if (dtorKind == QualType::DK_objc_strong_lifetime) {
    605       destroyer = CodeGenFunction::destroyARCStrongImprecise;
    606     } else {
    607       destroyer = CGF.getDestroyer(dtorKind);
    608     }
    609 
    610     // GEP down to the address.
    611     llvm::Value *addr = CGF.Builder.CreateStructGEP(blockInfo.Address,
    612                                                     capture.getIndex());
    613 
    614     // We can use that GEP as the dominating IP.
    615     if (!blockInfo.DominatingIP)
    616       blockInfo.DominatingIP = cast<llvm::Instruction>(addr);
    617 
    618     CleanupKind cleanupKind = InactiveNormalCleanup;
    619     bool useArrayEHCleanup = CGF.needsEHCleanup(dtorKind);
    620     if (useArrayEHCleanup)
    621       cleanupKind = InactiveNormalAndEHCleanup;
    622 
    623     CGF.pushDestroy(cleanupKind, addr, variable->getType(),
    624                     destroyer, useArrayEHCleanup);
    625 
    626     // Remember where that cleanup was.
    627     capture.setCleanup(CGF.EHStack.stable_begin());
    628   }
    629 }
    630 
    631 /// Enter a full-expression with a non-trivial number of objects to
    632 /// clean up.  This is in this file because, at the moment, the only
    633 /// kind of cleanup object is a BlockDecl*.
    634 void CodeGenFunction::enterNonTrivialFullExpression(const ExprWithCleanups *E) {
    635   assert(E->getNumObjects() != 0);
    636   ArrayRef<ExprWithCleanups::CleanupObject> cleanups = E->getObjects();
    637   for (ArrayRef<ExprWithCleanups::CleanupObject>::iterator
    638          i = cleanups.begin(), e = cleanups.end(); i != e; ++i) {
    639     enterBlockScope(*this, *i);
    640   }
    641 }
    642 
    643 /// Find the layout for the given block in a linked list and remove it.
    644 static CGBlockInfo *findAndRemoveBlockInfo(CGBlockInfo **head,
    645                                            const BlockDecl *block) {
    646   while (true) {
    647     assert(head && *head);
    648     CGBlockInfo *cur = *head;
    649 
    650     // If this is the block we're looking for, splice it out of the list.
    651     if (cur->getBlockDecl() == block) {
    652       *head = cur->NextBlockInfo;
    653       return cur;
    654     }
    655 
    656     head = &cur->NextBlockInfo;
    657   }
    658 }
    659 
    660 /// Destroy a chain of block layouts.
    661 void CodeGenFunction::destroyBlockInfos(CGBlockInfo *head) {
    662   assert(head && "destroying an empty chain");
    663   do {
    664     CGBlockInfo *cur = head;
    665     head = cur->NextBlockInfo;
    666     delete cur;
    667   } while (head != 0);
    668 }
    669 
    670 /// Emit a block literal expression in the current function.
    671 llvm::Value *CodeGenFunction::EmitBlockLiteral(const BlockExpr *blockExpr) {
    672   // If the block has no captures, we won't have a pre-computed
    673   // layout for it.
    674   if (!blockExpr->getBlockDecl()->hasCaptures()) {
    675     CGBlockInfo blockInfo(blockExpr->getBlockDecl(), CurFn->getName());
    676     computeBlockInfo(CGM, this, blockInfo);
    677     blockInfo.BlockExpression = blockExpr;
    678     return EmitBlockLiteral(blockInfo);
    679   }
    680 
    681   // Find the block info for this block and take ownership of it.
    682   OwningPtr<CGBlockInfo> blockInfo;
    683   blockInfo.reset(findAndRemoveBlockInfo(&FirstBlockInfo,
    684                                          blockExpr->getBlockDecl()));
    685 
    686   blockInfo->BlockExpression = blockExpr;
    687   return EmitBlockLiteral(*blockInfo);
    688 }
    689 
    690 llvm::Value *CodeGenFunction::EmitBlockLiteral(const CGBlockInfo &blockInfo) {
    691   // Using the computed layout, generate the actual block function.
    692   bool isLambdaConv = blockInfo.getBlockDecl()->isConversionFromLambda();
    693   llvm::Constant *blockFn
    694     = CodeGenFunction(CGM, true).GenerateBlockFunction(CurGD, blockInfo,
    695                                                        LocalDeclMap,
    696                                                        isLambdaConv);
    697   blockFn = llvm::ConstantExpr::getBitCast(blockFn, VoidPtrTy);
    698 
    699   // If there is nothing to capture, we can emit this as a global block.
    700   if (blockInfo.CanBeGlobal)
    701     return buildGlobalBlock(CGM, blockInfo, blockFn);
    702 
    703   // Otherwise, we have to emit this as a local block.
    704 
    705   llvm::Constant *isa = CGM.getNSConcreteStackBlock();
    706   isa = llvm::ConstantExpr::getBitCast(isa, VoidPtrTy);
    707 
    708   // Build the block descriptor.
    709   llvm::Constant *descriptor = buildBlockDescriptor(CGM, blockInfo);
    710 
    711   llvm::AllocaInst *blockAddr = blockInfo.Address;
    712   assert(blockAddr && "block has no address!");
    713 
    714   // Compute the initial on-stack block flags.
    715   BlockFlags flags = BLOCK_HAS_SIGNATURE;
    716   if (blockInfo.HasCapturedVariableLayout) flags |= BLOCK_HAS_EXTENDED_LAYOUT;
    717   if (blockInfo.NeedsCopyDispose) flags |= BLOCK_HAS_COPY_DISPOSE;
    718   if (blockInfo.HasCXXObject) flags |= BLOCK_HAS_CXX_OBJ;
    719   if (blockInfo.UsesStret) flags |= BLOCK_USE_STRET;
    720 
    721   // Initialize the block literal.
    722   Builder.CreateStore(isa, Builder.CreateStructGEP(blockAddr, 0, "block.isa"));
    723   Builder.CreateStore(llvm::ConstantInt::get(IntTy, flags.getBitMask()),
    724                       Builder.CreateStructGEP(blockAddr, 1, "block.flags"));
    725   Builder.CreateStore(llvm::ConstantInt::get(IntTy, 0),
    726                       Builder.CreateStructGEP(blockAddr, 2, "block.reserved"));
    727   Builder.CreateStore(blockFn, Builder.CreateStructGEP(blockAddr, 3,
    728                                                        "block.invoke"));
    729   Builder.CreateStore(descriptor, Builder.CreateStructGEP(blockAddr, 4,
    730                                                           "block.descriptor"));
    731 
    732   // Finally, capture all the values into the block.
    733   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
    734 
    735   // First, 'this'.
    736   if (blockDecl->capturesCXXThis()) {
    737     llvm::Value *addr = Builder.CreateStructGEP(blockAddr,
    738                                                 blockInfo.CXXThisIndex,
    739                                                 "block.captured-this.addr");
    740     Builder.CreateStore(LoadCXXThis(), addr);
    741   }
    742 
    743   // Next, captured variables.
    744   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
    745          ce = blockDecl->capture_end(); ci != ce; ++ci) {
    746     const VarDecl *variable = ci->getVariable();
    747     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
    748 
    749     // Ignore constant captures.
    750     if (capture.isConstant()) continue;
    751 
    752     QualType type = variable->getType();
    753     CharUnits align = getContext().getDeclAlign(variable);
    754 
    755     // This will be a [[type]]*, except that a byref entry will just be
    756     // an i8**.
    757     llvm::Value *blockField =
    758       Builder.CreateStructGEP(blockAddr, capture.getIndex(),
    759                               "block.captured");
    760 
    761     // Compute the address of the thing we're going to move into the
    762     // block literal.
    763     llvm::Value *src;
    764     if (BlockInfo && ci->isNested()) {
    765       // We need to use the capture from the enclosing block.
    766       const CGBlockInfo::Capture &enclosingCapture =
    767         BlockInfo->getCapture(variable);
    768 
    769       // This is a [[type]]*, except that a byref entry wil just be an i8**.
    770       src = Builder.CreateStructGEP(LoadBlockStruct(),
    771                                     enclosingCapture.getIndex(),
    772                                     "block.capture.addr");
    773     } else if (blockDecl->isConversionFromLambda()) {
    774       // The lambda capture in a lambda's conversion-to-block-pointer is
    775       // special; we'll simply emit it directly.
    776       src = 0;
    777     } else {
    778       // Just look it up in the locals map, which will give us back a
    779       // [[type]]*.  If that doesn't work, do the more elaborate DRE
    780       // emission.
    781       src = LocalDeclMap.lookup(variable);
    782       if (!src) {
    783         DeclRefExpr declRef(const_cast<VarDecl*>(variable),
    784                             /*refersToEnclosing*/ ci->isNested(), type,
    785                             VK_LValue, SourceLocation());
    786         src = EmitDeclRefLValue(&declRef).getAddress();
    787       }
    788     }
    789 
    790     // For byrefs, we just write the pointer to the byref struct into
    791     // the block field.  There's no need to chase the forwarding
    792     // pointer at this point, since we're building something that will
    793     // live a shorter life than the stack byref anyway.
    794     if (ci->isByRef()) {
    795       // Get a void* that points to the byref struct.
    796       if (ci->isNested())
    797         src = Builder.CreateAlignedLoad(src, align.getQuantity(),
    798                                         "byref.capture");
    799       else
    800         src = Builder.CreateBitCast(src, VoidPtrTy);
    801 
    802       // Write that void* into the capture field.
    803       Builder.CreateAlignedStore(src, blockField, align.getQuantity());
    804 
    805     // If we have a copy constructor, evaluate that into the block field.
    806     } else if (const Expr *copyExpr = ci->getCopyExpr()) {
    807       if (blockDecl->isConversionFromLambda()) {
    808         // If we have a lambda conversion, emit the expression
    809         // directly into the block instead.
    810         AggValueSlot Slot =
    811             AggValueSlot::forAddr(blockField, align, Qualifiers(),
    812                                   AggValueSlot::IsDestructed,
    813                                   AggValueSlot::DoesNotNeedGCBarriers,
    814                                   AggValueSlot::IsNotAliased);
    815         EmitAggExpr(copyExpr, Slot);
    816       } else {
    817         EmitSynthesizedCXXCopyCtor(blockField, src, copyExpr);
    818       }
    819 
    820     // If it's a reference variable, copy the reference into the block field.
    821     } else if (type->isReferenceType()) {
    822       llvm::Value *ref =
    823         Builder.CreateAlignedLoad(src, align.getQuantity(), "ref.val");
    824       Builder.CreateAlignedStore(ref, blockField, align.getQuantity());
    825 
    826     // If this is an ARC __strong block-pointer variable, don't do a
    827     // block copy.
    828     //
    829     // TODO: this can be generalized into the normal initialization logic:
    830     // we should never need to do a block-copy when initializing a local
    831     // variable, because the local variable's lifetime should be strictly
    832     // contained within the stack block's.
    833     } else if (type.getObjCLifetime() == Qualifiers::OCL_Strong &&
    834                type->isBlockPointerType()) {
    835       // Load the block and do a simple retain.
    836       LValue srcLV = MakeAddrLValue(src, type, align);
    837       llvm::Value *value = EmitLoadOfScalar(srcLV);
    838       value = EmitARCRetainNonBlock(value);
    839 
    840       // Do a primitive store to the block field.
    841       LValue destLV = MakeAddrLValue(blockField, type, align);
    842       EmitStoreOfScalar(value, destLV, /*init*/ true);
    843 
    844     // Otherwise, fake up a POD copy into the block field.
    845     } else {
    846       // Fake up a new variable so that EmitScalarInit doesn't think
    847       // we're referring to the variable in its own initializer.
    848       ImplicitParamDecl blockFieldPseudoVar(/*DC*/ 0, SourceLocation(),
    849                                             /*name*/ 0, type);
    850 
    851       // We use one of these or the other depending on whether the
    852       // reference is nested.
    853       DeclRefExpr declRef(const_cast<VarDecl*>(variable),
    854                           /*refersToEnclosing*/ ci->isNested(), type,
    855                           VK_LValue, SourceLocation());
    856 
    857       ImplicitCastExpr l2r(ImplicitCastExpr::OnStack, type, CK_LValueToRValue,
    858                            &declRef, VK_RValue);
    859       EmitExprAsInit(&l2r, &blockFieldPseudoVar,
    860                      MakeAddrLValue(blockField, type, align),
    861                      /*captured by init*/ false);
    862     }
    863 
    864     // Activate the cleanup if layout pushed one.
    865     if (!ci->isByRef()) {
    866       EHScopeStack::stable_iterator cleanup = capture.getCleanup();
    867       if (cleanup.isValid())
    868         ActivateCleanupBlock(cleanup, blockInfo.DominatingIP);
    869     }
    870   }
    871 
    872   // Cast to the converted block-pointer type, which happens (somewhat
    873   // unfortunately) to be a pointer to function type.
    874   llvm::Value *result =
    875     Builder.CreateBitCast(blockAddr,
    876                           ConvertType(blockInfo.getBlockExpr()->getType()));
    877 
    878   return result;
    879 }
    880 
    881 
    882 llvm::Type *CodeGenModule::getBlockDescriptorType() {
    883   if (BlockDescriptorType)
    884     return BlockDescriptorType;
    885 
    886   llvm::Type *UnsignedLongTy =
    887     getTypes().ConvertType(getContext().UnsignedLongTy);
    888 
    889   // struct __block_descriptor {
    890   //   unsigned long reserved;
    891   //   unsigned long block_size;
    892   //
    893   //   // later, the following will be added
    894   //
    895   //   struct {
    896   //     void (*copyHelper)();
    897   //     void (*copyHelper)();
    898   //   } helpers;                // !!! optional
    899   //
    900   //   const char *signature;   // the block signature
    901   //   const char *layout;      // reserved
    902   // };
    903   BlockDescriptorType =
    904     llvm::StructType::create("struct.__block_descriptor",
    905                              UnsignedLongTy, UnsignedLongTy, NULL);
    906 
    907   // Now form a pointer to that.
    908   BlockDescriptorType = llvm::PointerType::getUnqual(BlockDescriptorType);
    909   return BlockDescriptorType;
    910 }
    911 
    912 llvm::Type *CodeGenModule::getGenericBlockLiteralType() {
    913   if (GenericBlockLiteralType)
    914     return GenericBlockLiteralType;
    915 
    916   llvm::Type *BlockDescPtrTy = getBlockDescriptorType();
    917 
    918   // struct __block_literal_generic {
    919   //   void *__isa;
    920   //   int __flags;
    921   //   int __reserved;
    922   //   void (*__invoke)(void *);
    923   //   struct __block_descriptor *__descriptor;
    924   // };
    925   GenericBlockLiteralType =
    926     llvm::StructType::create("struct.__block_literal_generic",
    927                              VoidPtrTy, IntTy, IntTy, VoidPtrTy,
    928                              BlockDescPtrTy, NULL);
    929 
    930   return GenericBlockLiteralType;
    931 }
    932 
    933 
    934 RValue CodeGenFunction::EmitBlockCallExpr(const CallExpr* E,
    935                                           ReturnValueSlot ReturnValue) {
    936   const BlockPointerType *BPT =
    937     E->getCallee()->getType()->getAs<BlockPointerType>();
    938 
    939   llvm::Value *Callee = EmitScalarExpr(E->getCallee());
    940 
    941   // Get a pointer to the generic block literal.
    942   llvm::Type *BlockLiteralTy =
    943     llvm::PointerType::getUnqual(CGM.getGenericBlockLiteralType());
    944 
    945   // Bitcast the callee to a block literal.
    946   llvm::Value *BlockLiteral =
    947     Builder.CreateBitCast(Callee, BlockLiteralTy, "block.literal");
    948 
    949   // Get the function pointer from the literal.
    950   llvm::Value *FuncPtr = Builder.CreateStructGEP(BlockLiteral, 3);
    951 
    952   BlockLiteral = Builder.CreateBitCast(BlockLiteral, VoidPtrTy);
    953 
    954   // Add the block literal.
    955   CallArgList Args;
    956   Args.add(RValue::get(BlockLiteral), getContext().VoidPtrTy);
    957 
    958   QualType FnType = BPT->getPointeeType();
    959 
    960   // And the rest of the arguments.
    961   EmitCallArgs(Args, FnType->getAs<FunctionProtoType>(),
    962                E->arg_begin(), E->arg_end());
    963 
    964   // Load the function.
    965   llvm::Value *Func = Builder.CreateLoad(FuncPtr);
    966 
    967   const FunctionType *FuncTy = FnType->castAs<FunctionType>();
    968   const CGFunctionInfo &FnInfo =
    969     CGM.getTypes().arrangeBlockFunctionCall(Args, FuncTy);
    970 
    971   // Cast the function pointer to the right type.
    972   llvm::Type *BlockFTy = CGM.getTypes().GetFunctionType(FnInfo);
    973 
    974   llvm::Type *BlockFTyPtr = llvm::PointerType::getUnqual(BlockFTy);
    975   Func = Builder.CreateBitCast(Func, BlockFTyPtr);
    976 
    977   // And call the block.
    978   return EmitCall(FnInfo, Func, ReturnValue, Args);
    979 }
    980 
    981 llvm::Value *CodeGenFunction::GetAddrOfBlockDecl(const VarDecl *variable,
    982                                                  bool isByRef) {
    983   assert(BlockInfo && "evaluating block ref without block information?");
    984   const CGBlockInfo::Capture &capture = BlockInfo->getCapture(variable);
    985 
    986   // Handle constant captures.
    987   if (capture.isConstant()) return LocalDeclMap[variable];
    988 
    989   llvm::Value *addr =
    990     Builder.CreateStructGEP(LoadBlockStruct(), capture.getIndex(),
    991                             "block.capture.addr");
    992 
    993   if (isByRef) {
    994     // addr should be a void** right now.  Load, then cast the result
    995     // to byref*.
    996 
    997     addr = Builder.CreateLoad(addr);
    998     llvm::PointerType *byrefPointerType
    999       = llvm::PointerType::get(BuildByRefType(variable), 0);
   1000     addr = Builder.CreateBitCast(addr, byrefPointerType,
   1001                                  "byref.addr");
   1002 
   1003     // Follow the forwarding pointer.
   1004     addr = Builder.CreateStructGEP(addr, 1, "byref.forwarding");
   1005     addr = Builder.CreateLoad(addr, "byref.addr.forwarded");
   1006 
   1007     // Cast back to byref* and GEP over to the actual object.
   1008     addr = Builder.CreateBitCast(addr, byrefPointerType);
   1009     addr = Builder.CreateStructGEP(addr, getByRefValueLLVMField(variable),
   1010                                    variable->getNameAsString());
   1011   }
   1012 
   1013   if (variable->getType()->isReferenceType())
   1014     addr = Builder.CreateLoad(addr, "ref.tmp");
   1015 
   1016   return addr;
   1017 }
   1018 
   1019 llvm::Constant *
   1020 CodeGenModule::GetAddrOfGlobalBlock(const BlockExpr *blockExpr,
   1021                                     const char *name) {
   1022   CGBlockInfo blockInfo(blockExpr->getBlockDecl(), name);
   1023   blockInfo.BlockExpression = blockExpr;
   1024 
   1025   // Compute information about the layout, etc., of this block.
   1026   computeBlockInfo(*this, 0, blockInfo);
   1027 
   1028   // Using that metadata, generate the actual block function.
   1029   llvm::Constant *blockFn;
   1030   {
   1031     llvm::DenseMap<const Decl*, llvm::Value*> LocalDeclMap;
   1032     blockFn = CodeGenFunction(*this).GenerateBlockFunction(GlobalDecl(),
   1033                                                            blockInfo,
   1034                                                            LocalDeclMap,
   1035                                                            false);
   1036   }
   1037   blockFn = llvm::ConstantExpr::getBitCast(blockFn, VoidPtrTy);
   1038 
   1039   return buildGlobalBlock(*this, blockInfo, blockFn);
   1040 }
   1041 
   1042 static llvm::Constant *buildGlobalBlock(CodeGenModule &CGM,
   1043                                         const CGBlockInfo &blockInfo,
   1044                                         llvm::Constant *blockFn) {
   1045   assert(blockInfo.CanBeGlobal);
   1046 
   1047   // Generate the constants for the block literal initializer.
   1048   llvm::Constant *fields[BlockHeaderSize];
   1049 
   1050   // isa
   1051   fields[0] = CGM.getNSConcreteGlobalBlock();
   1052 
   1053   // __flags
   1054   BlockFlags flags = BLOCK_IS_GLOBAL | BLOCK_HAS_SIGNATURE;
   1055   if (blockInfo.UsesStret) flags |= BLOCK_USE_STRET;
   1056 
   1057   fields[1] = llvm::ConstantInt::get(CGM.IntTy, flags.getBitMask());
   1058 
   1059   // Reserved
   1060   fields[2] = llvm::Constant::getNullValue(CGM.IntTy);
   1061 
   1062   // Function
   1063   fields[3] = blockFn;
   1064 
   1065   // Descriptor
   1066   fields[4] = buildBlockDescriptor(CGM, blockInfo);
   1067 
   1068   llvm::Constant *init = llvm::ConstantStruct::getAnon(fields);
   1069 
   1070   llvm::GlobalVariable *literal =
   1071     new llvm::GlobalVariable(CGM.getModule(),
   1072                              init->getType(),
   1073                              /*constant*/ true,
   1074                              llvm::GlobalVariable::InternalLinkage,
   1075                              init,
   1076                              "__block_literal_global");
   1077   literal->setAlignment(blockInfo.BlockAlign.getQuantity());
   1078 
   1079   // Return a constant of the appropriately-casted type.
   1080   llvm::Type *requiredType =
   1081     CGM.getTypes().ConvertType(blockInfo.getBlockExpr()->getType());
   1082   return llvm::ConstantExpr::getBitCast(literal, requiredType);
   1083 }
   1084 
   1085 llvm::Function *
   1086 CodeGenFunction::GenerateBlockFunction(GlobalDecl GD,
   1087                                        const CGBlockInfo &blockInfo,
   1088                                        const DeclMapTy &ldm,
   1089                                        bool IsLambdaConversionToBlock) {
   1090   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
   1091 
   1092   // Check if we should generate debug info for this block function.
   1093   maybeInitializeDebugInfo();
   1094   CurGD = GD;
   1095 
   1096   BlockInfo = &blockInfo;
   1097 
   1098   // Arrange for local static and local extern declarations to appear
   1099   // to be local to this function as well, in case they're directly
   1100   // referenced in a block.
   1101   for (DeclMapTy::const_iterator i = ldm.begin(), e = ldm.end(); i != e; ++i) {
   1102     const VarDecl *var = dyn_cast<VarDecl>(i->first);
   1103     if (var && !var->hasLocalStorage())
   1104       LocalDeclMap[var] = i->second;
   1105   }
   1106 
   1107   // Begin building the function declaration.
   1108 
   1109   // Build the argument list.
   1110   FunctionArgList args;
   1111 
   1112   // The first argument is the block pointer.  Just take it as a void*
   1113   // and cast it later.
   1114   QualType selfTy = getContext().VoidPtrTy;
   1115   IdentifierInfo *II = &CGM.getContext().Idents.get(".block_descriptor");
   1116 
   1117   ImplicitParamDecl selfDecl(const_cast<BlockDecl*>(blockDecl),
   1118                              SourceLocation(), II, selfTy);
   1119   args.push_back(&selfDecl);
   1120 
   1121   // Now add the rest of the parameters.
   1122   for (BlockDecl::param_const_iterator i = blockDecl->param_begin(),
   1123        e = blockDecl->param_end(); i != e; ++i)
   1124     args.push_back(*i);
   1125 
   1126   // Create the function declaration.
   1127   const FunctionProtoType *fnType = blockInfo.getBlockExpr()->getFunctionType();
   1128   const CGFunctionInfo &fnInfo =
   1129     CGM.getTypes().arrangeFunctionDeclaration(fnType->getResultType(), args,
   1130                                               fnType->getExtInfo(),
   1131                                               fnType->isVariadic());
   1132   if (CGM.ReturnTypeUsesSRet(fnInfo))
   1133     blockInfo.UsesStret = true;
   1134 
   1135   llvm::FunctionType *fnLLVMType = CGM.getTypes().GetFunctionType(fnInfo);
   1136 
   1137   MangleBuffer name;
   1138   CGM.getBlockMangledName(GD, name, blockDecl);
   1139   llvm::Function *fn =
   1140     llvm::Function::Create(fnLLVMType, llvm::GlobalValue::InternalLinkage,
   1141                            name.getString(), &CGM.getModule());
   1142   CGM.SetInternalFunctionAttributes(blockDecl, fn, fnInfo);
   1143 
   1144   // Begin generating the function.
   1145   StartFunction(blockDecl, fnType->getResultType(), fn, fnInfo, args,
   1146                 blockInfo.getBlockExpr()->getBody()->getLocStart());
   1147 
   1148   // Okay.  Undo some of what StartFunction did.
   1149 
   1150   // Pull the 'self' reference out of the local decl map.
   1151   llvm::Value *blockAddr = LocalDeclMap[&selfDecl];
   1152   LocalDeclMap.erase(&selfDecl);
   1153   BlockPointer = Builder.CreateBitCast(blockAddr,
   1154                                        blockInfo.StructureType->getPointerTo(),
   1155                                        "block");
   1156   // At -O0 we generate an explicit alloca for the BlockPointer, so the RA
   1157   // won't delete the dbg.declare intrinsics for captured variables.
   1158   llvm::Value *BlockPointerDbgLoc = BlockPointer;
   1159   if (CGM.getCodeGenOpts().OptimizationLevel == 0) {
   1160     // Allocate a stack slot for it, so we can point the debugger to it
   1161     llvm::AllocaInst *Alloca = CreateTempAlloca(BlockPointer->getType(),
   1162                                                 "block.addr");
   1163     unsigned Align = getContext().getDeclAlign(&selfDecl).getQuantity();
   1164     Alloca->setAlignment(Align);
   1165     // Set the DebugLocation to empty, so the store is recognized as a
   1166     // frame setup instruction by llvm::DwarfDebug::beginFunction().
   1167     NoLocation NL(*this, Builder);
   1168     Builder.CreateAlignedStore(BlockPointer, Alloca, Align);
   1169     BlockPointerDbgLoc = Alloca;
   1170   }
   1171 
   1172   // If we have a C++ 'this' reference, go ahead and force it into
   1173   // existence now.
   1174   if (blockDecl->capturesCXXThis()) {
   1175     llvm::Value *addr = Builder.CreateStructGEP(BlockPointer,
   1176                                                 blockInfo.CXXThisIndex,
   1177                                                 "block.captured-this");
   1178     CXXThisValue = Builder.CreateLoad(addr, "this");
   1179   }
   1180 
   1181   // Also force all the constant captures.
   1182   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
   1183          ce = blockDecl->capture_end(); ci != ce; ++ci) {
   1184     const VarDecl *variable = ci->getVariable();
   1185     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
   1186     if (!capture.isConstant()) continue;
   1187 
   1188     unsigned align = getContext().getDeclAlign(variable).getQuantity();
   1189 
   1190     llvm::AllocaInst *alloca =
   1191       CreateMemTemp(variable->getType(), "block.captured-const");
   1192     alloca->setAlignment(align);
   1193 
   1194     Builder.CreateAlignedStore(capture.getConstant(), alloca, align);
   1195 
   1196     LocalDeclMap[variable] = alloca;
   1197   }
   1198 
   1199   // Save a spot to insert the debug information for all the DeclRefExprs.
   1200   llvm::BasicBlock *entry = Builder.GetInsertBlock();
   1201   llvm::BasicBlock::iterator entry_ptr = Builder.GetInsertPoint();
   1202   --entry_ptr;
   1203 
   1204   if (IsLambdaConversionToBlock)
   1205     EmitLambdaBlockInvokeBody();
   1206   else
   1207     EmitStmt(blockDecl->getBody());
   1208 
   1209   // Remember where we were...
   1210   llvm::BasicBlock *resume = Builder.GetInsertBlock();
   1211 
   1212   // Go back to the entry.
   1213   ++entry_ptr;
   1214   Builder.SetInsertPoint(entry, entry_ptr);
   1215 
   1216   // Emit debug information for all the DeclRefExprs.
   1217   // FIXME: also for 'this'
   1218   if (CGDebugInfo *DI = getDebugInfo()) {
   1219     for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
   1220            ce = blockDecl->capture_end(); ci != ce; ++ci) {
   1221       const VarDecl *variable = ci->getVariable();
   1222       DI->EmitLocation(Builder, variable->getLocation());
   1223 
   1224       if (CGM.getCodeGenOpts().getDebugInfo()
   1225             >= CodeGenOptions::LimitedDebugInfo) {
   1226         const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
   1227         if (capture.isConstant()) {
   1228           DI->EmitDeclareOfAutoVariable(variable, LocalDeclMap[variable],
   1229                                         Builder);
   1230           continue;
   1231         }
   1232 
   1233         DI->EmitDeclareOfBlockDeclRefVariable(variable, BlockPointerDbgLoc,
   1234                                               Builder, blockInfo);
   1235       }
   1236     }
   1237     // Recover location if it was changed in the above loop.
   1238     DI->EmitLocation(Builder,
   1239                      cast<CompoundStmt>(blockDecl->getBody())->getRBracLoc());
   1240   }
   1241 
   1242   // And resume where we left off.
   1243   if (resume == 0)
   1244     Builder.ClearInsertionPoint();
   1245   else
   1246     Builder.SetInsertPoint(resume);
   1247 
   1248   FinishFunction(cast<CompoundStmt>(blockDecl->getBody())->getRBracLoc());
   1249 
   1250   return fn;
   1251 }
   1252 
   1253 /*
   1254     notes.push_back(HelperInfo());
   1255     HelperInfo &note = notes.back();
   1256     note.index = capture.getIndex();
   1257     note.RequiresCopying = (ci->hasCopyExpr() || BlockRequiresCopying(type));
   1258     note.cxxbar_import = ci->getCopyExpr();
   1259 
   1260     if (ci->isByRef()) {
   1261       note.flag = BLOCK_FIELD_IS_BYREF;
   1262       if (type.isObjCGCWeak())
   1263         note.flag |= BLOCK_FIELD_IS_WEAK;
   1264     } else if (type->isBlockPointerType()) {
   1265       note.flag = BLOCK_FIELD_IS_BLOCK;
   1266     } else {
   1267       note.flag = BLOCK_FIELD_IS_OBJECT;
   1268     }
   1269  */
   1270 
   1271 
   1272 /// Generate the copy-helper function for a block closure object:
   1273 ///   static void block_copy_helper(block_t *dst, block_t *src);
   1274 /// The runtime will have previously initialized 'dst' by doing a
   1275 /// bit-copy of 'src'.
   1276 ///
   1277 /// Note that this copies an entire block closure object to the heap;
   1278 /// it should not be confused with a 'byref copy helper', which moves
   1279 /// the contents of an individual __block variable to the heap.
   1280 llvm::Constant *
   1281 CodeGenFunction::GenerateCopyHelperFunction(const CGBlockInfo &blockInfo) {
   1282   ASTContext &C = getContext();
   1283 
   1284   FunctionArgList args;
   1285   ImplicitParamDecl dstDecl(0, SourceLocation(), 0, C.VoidPtrTy);
   1286   args.push_back(&dstDecl);
   1287   ImplicitParamDecl srcDecl(0, SourceLocation(), 0, C.VoidPtrTy);
   1288   args.push_back(&srcDecl);
   1289 
   1290   const CGFunctionInfo &FI =
   1291     CGM.getTypes().arrangeFunctionDeclaration(C.VoidTy, args,
   1292                                               FunctionType::ExtInfo(),
   1293                                               /*variadic*/ false);
   1294 
   1295   // FIXME: it would be nice if these were mergeable with things with
   1296   // identical semantics.
   1297   llvm::FunctionType *LTy = CGM.getTypes().GetFunctionType(FI);
   1298 
   1299   llvm::Function *Fn =
   1300     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
   1301                            "__copy_helper_block_", &CGM.getModule());
   1302 
   1303   IdentifierInfo *II
   1304     = &CGM.getContext().Idents.get("__copy_helper_block_");
   1305 
   1306   // Check if we should generate debug info for this block helper function.
   1307   maybeInitializeDebugInfo();
   1308 
   1309   FunctionDecl *FD = FunctionDecl::Create(C,
   1310                                           C.getTranslationUnitDecl(),
   1311                                           SourceLocation(),
   1312                                           SourceLocation(), II, C.VoidTy, 0,
   1313                                           SC_Static,
   1314                                           false,
   1315                                           false);
   1316   // Create a scope with an artificial location for the body of this function.
   1317   ArtificialLocation AL(*this, Builder);
   1318   StartFunction(FD, C.VoidTy, Fn, FI, args, SourceLocation());
   1319   AL.Emit();
   1320 
   1321   llvm::Type *structPtrTy = blockInfo.StructureType->getPointerTo();
   1322 
   1323   llvm::Value *src = GetAddrOfLocalVar(&srcDecl);
   1324   src = Builder.CreateLoad(src);
   1325   src = Builder.CreateBitCast(src, structPtrTy, "block.source");
   1326 
   1327   llvm::Value *dst = GetAddrOfLocalVar(&dstDecl);
   1328   dst = Builder.CreateLoad(dst);
   1329   dst = Builder.CreateBitCast(dst, structPtrTy, "block.dest");
   1330 
   1331   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
   1332 
   1333   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
   1334          ce = blockDecl->capture_end(); ci != ce; ++ci) {
   1335     const VarDecl *variable = ci->getVariable();
   1336     QualType type = variable->getType();
   1337 
   1338     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
   1339     if (capture.isConstant()) continue;
   1340 
   1341     const Expr *copyExpr = ci->getCopyExpr();
   1342     BlockFieldFlags flags;
   1343 
   1344     bool useARCWeakCopy = false;
   1345     bool useARCStrongCopy = false;
   1346 
   1347     if (copyExpr) {
   1348       assert(!ci->isByRef());
   1349       // don't bother computing flags
   1350 
   1351     } else if (ci->isByRef()) {
   1352       flags = BLOCK_FIELD_IS_BYREF;
   1353       if (type.isObjCGCWeak())
   1354         flags |= BLOCK_FIELD_IS_WEAK;
   1355 
   1356     } else if (type->isObjCRetainableType()) {
   1357       flags = BLOCK_FIELD_IS_OBJECT;
   1358       bool isBlockPointer = type->isBlockPointerType();
   1359       if (isBlockPointer)
   1360         flags = BLOCK_FIELD_IS_BLOCK;
   1361 
   1362       // Special rules for ARC captures:
   1363       if (getLangOpts().ObjCAutoRefCount) {
   1364         Qualifiers qs = type.getQualifiers();
   1365 
   1366         // We need to register __weak direct captures with the runtime.
   1367         if (qs.getObjCLifetime() == Qualifiers::OCL_Weak) {
   1368           useARCWeakCopy = true;
   1369 
   1370         // We need to retain the copied value for __strong direct captures.
   1371         } else if (qs.getObjCLifetime() == Qualifiers::OCL_Strong) {
   1372           // If it's a block pointer, we have to copy the block and
   1373           // assign that to the destination pointer, so we might as
   1374           // well use _Block_object_assign.  Otherwise we can avoid that.
   1375           if (!isBlockPointer)
   1376             useARCStrongCopy = true;
   1377 
   1378         // Otherwise the memcpy is fine.
   1379         } else {
   1380           continue;
   1381         }
   1382 
   1383       // Non-ARC captures of retainable pointers are strong and
   1384       // therefore require a call to _Block_object_assign.
   1385       } else {
   1386         // fall through
   1387       }
   1388     } else {
   1389       continue;
   1390     }
   1391 
   1392     unsigned index = capture.getIndex();
   1393     llvm::Value *srcField = Builder.CreateStructGEP(src, index);
   1394     llvm::Value *dstField = Builder.CreateStructGEP(dst, index);
   1395 
   1396     // If there's an explicit copy expression, we do that.
   1397     if (copyExpr) {
   1398       EmitSynthesizedCXXCopyCtor(dstField, srcField, copyExpr);
   1399     } else if (useARCWeakCopy) {
   1400       EmitARCCopyWeak(dstField, srcField);
   1401     } else {
   1402       llvm::Value *srcValue = Builder.CreateLoad(srcField, "blockcopy.src");
   1403       if (useARCStrongCopy) {
   1404         // At -O0, store null into the destination field (so that the
   1405         // storeStrong doesn't over-release) and then call storeStrong.
   1406         // This is a workaround to not having an initStrong call.
   1407         if (CGM.getCodeGenOpts().OptimizationLevel == 0) {
   1408           llvm::PointerType *ty = cast<llvm::PointerType>(srcValue->getType());
   1409           llvm::Value *null = llvm::ConstantPointerNull::get(ty);
   1410           Builder.CreateStore(null, dstField);
   1411           EmitARCStoreStrongCall(dstField, srcValue, true);
   1412 
   1413         // With optimization enabled, take advantage of the fact that
   1414         // the blocks runtime guarantees a memcpy of the block data, and
   1415         // just emit a retain of the src field.
   1416         } else {
   1417           EmitARCRetainNonBlock(srcValue);
   1418 
   1419           // We don't need this anymore, so kill it.  It's not quite
   1420           // worth the annoyance to avoid creating it in the first place.
   1421           cast<llvm::Instruction>(dstField)->eraseFromParent();
   1422         }
   1423       } else {
   1424         srcValue = Builder.CreateBitCast(srcValue, VoidPtrTy);
   1425         llvm::Value *dstAddr = Builder.CreateBitCast(dstField, VoidPtrTy);
   1426         llvm::Value *args[] = {
   1427           dstAddr, srcValue, llvm::ConstantInt::get(Int32Ty, flags.getBitMask())
   1428         };
   1429 
   1430         bool copyCanThrow = false;
   1431         if (ci->isByRef() && variable->getType()->getAsCXXRecordDecl()) {
   1432           const Expr *copyExpr =
   1433             CGM.getContext().getBlockVarCopyInits(variable);
   1434           if (copyExpr) {
   1435             copyCanThrow = true; // FIXME: reuse the noexcept logic
   1436           }
   1437         }
   1438 
   1439         if (copyCanThrow) {
   1440           EmitRuntimeCallOrInvoke(CGM.getBlockObjectAssign(), args);
   1441         } else {
   1442           EmitNounwindRuntimeCall(CGM.getBlockObjectAssign(), args);
   1443         }
   1444       }
   1445     }
   1446   }
   1447 
   1448   FinishFunction();
   1449 
   1450   return llvm::ConstantExpr::getBitCast(Fn, VoidPtrTy);
   1451 }
   1452 
   1453 /// Generate the destroy-helper function for a block closure object:
   1454 ///   static void block_destroy_helper(block_t *theBlock);
   1455 ///
   1456 /// Note that this destroys a heap-allocated block closure object;
   1457 /// it should not be confused with a 'byref destroy helper', which
   1458 /// destroys the heap-allocated contents of an individual __block
   1459 /// variable.
   1460 llvm::Constant *
   1461 CodeGenFunction::GenerateDestroyHelperFunction(const CGBlockInfo &blockInfo) {
   1462   ASTContext &C = getContext();
   1463 
   1464   FunctionArgList args;
   1465   ImplicitParamDecl srcDecl(0, SourceLocation(), 0, C.VoidPtrTy);
   1466   args.push_back(&srcDecl);
   1467 
   1468   const CGFunctionInfo &FI =
   1469     CGM.getTypes().arrangeFunctionDeclaration(C.VoidTy, args,
   1470                                               FunctionType::ExtInfo(),
   1471                                               /*variadic*/ false);
   1472 
   1473   // FIXME: We'd like to put these into a mergable by content, with
   1474   // internal linkage.
   1475   llvm::FunctionType *LTy = CGM.getTypes().GetFunctionType(FI);
   1476 
   1477   llvm::Function *Fn =
   1478     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
   1479                            "__destroy_helper_block_", &CGM.getModule());
   1480 
   1481   // Check if we should generate debug info for this block destroy function.
   1482   maybeInitializeDebugInfo();
   1483 
   1484   IdentifierInfo *II
   1485     = &CGM.getContext().Idents.get("__destroy_helper_block_");
   1486 
   1487   FunctionDecl *FD = FunctionDecl::Create(C, C.getTranslationUnitDecl(),
   1488                                           SourceLocation(),
   1489                                           SourceLocation(), II, C.VoidTy, 0,
   1490                                           SC_Static,
   1491                                           false, false);
   1492   // Create a scope with an artificial location for the body of this function.
   1493   ArtificialLocation AL(*this, Builder);
   1494   StartFunction(FD, C.VoidTy, Fn, FI, args, SourceLocation());
   1495   AL.Emit();
   1496 
   1497   llvm::Type *structPtrTy = blockInfo.StructureType->getPointerTo();
   1498 
   1499   llvm::Value *src = GetAddrOfLocalVar(&srcDecl);
   1500   src = Builder.CreateLoad(src);
   1501   src = Builder.CreateBitCast(src, structPtrTy, "block");
   1502 
   1503   const BlockDecl *blockDecl = blockInfo.getBlockDecl();
   1504 
   1505   CodeGenFunction::RunCleanupsScope cleanups(*this);
   1506 
   1507   for (BlockDecl::capture_const_iterator ci = blockDecl->capture_begin(),
   1508          ce = blockDecl->capture_end(); ci != ce; ++ci) {
   1509     const VarDecl *variable = ci->getVariable();
   1510     QualType type = variable->getType();
   1511 
   1512     const CGBlockInfo::Capture &capture = blockInfo.getCapture(variable);
   1513     if (capture.isConstant()) continue;
   1514 
   1515     BlockFieldFlags flags;
   1516     const CXXDestructorDecl *dtor = 0;
   1517 
   1518     bool useARCWeakDestroy = false;
   1519     bool useARCStrongDestroy = false;
   1520 
   1521     if (ci->isByRef()) {
   1522       flags = BLOCK_FIELD_IS_BYREF;
   1523       if (type.isObjCGCWeak())
   1524         flags |= BLOCK_FIELD_IS_WEAK;
   1525     } else if (const CXXRecordDecl *record = type->getAsCXXRecordDecl()) {
   1526       if (record->hasTrivialDestructor())
   1527         continue;
   1528       dtor = record->getDestructor();
   1529     } else if (type->isObjCRetainableType()) {
   1530       flags = BLOCK_FIELD_IS_OBJECT;
   1531       if (type->isBlockPointerType())
   1532         flags = BLOCK_FIELD_IS_BLOCK;
   1533 
   1534       // Special rules for ARC captures.
   1535       if (getLangOpts().ObjCAutoRefCount) {
   1536         Qualifiers qs = type.getQualifiers();
   1537 
   1538         // Don't generate special dispose logic for a captured object
   1539         // unless it's __strong or __weak.
   1540         if (!qs.hasStrongOrWeakObjCLifetime())
   1541           continue;
   1542 
   1543         // Support __weak direct captures.
   1544         if (qs.getObjCLifetime() == Qualifiers::OCL_Weak)
   1545           useARCWeakDestroy = true;
   1546 
   1547         // Tools really want us to use objc_storeStrong here.
   1548         else
   1549           useARCStrongDestroy = true;
   1550       }
   1551     } else {
   1552       continue;
   1553     }
   1554 
   1555     unsigned index = capture.getIndex();
   1556     llvm::Value *srcField = Builder.CreateStructGEP(src, index);
   1557 
   1558     // If there's an explicit copy expression, we do that.
   1559     if (dtor) {
   1560       PushDestructorCleanup(dtor, srcField);
   1561 
   1562     // If this is a __weak capture, emit the release directly.
   1563     } else if (useARCWeakDestroy) {
   1564       EmitARCDestroyWeak(srcField);
   1565 
   1566     // Destroy strong objects with a call if requested.
   1567     } else if (useARCStrongDestroy) {
   1568       EmitARCDestroyStrong(srcField, ARCImpreciseLifetime);
   1569 
   1570     // Otherwise we call _Block_object_dispose.  It wouldn't be too
   1571     // hard to just emit this as a cleanup if we wanted to make sure
   1572     // that things were done in reverse.
   1573     } else {
   1574       llvm::Value *value = Builder.CreateLoad(srcField);
   1575       value = Builder.CreateBitCast(value, VoidPtrTy);
   1576       BuildBlockRelease(value, flags);
   1577     }
   1578   }
   1579 
   1580   cleanups.ForceCleanup();
   1581 
   1582   FinishFunction();
   1583 
   1584   return llvm::ConstantExpr::getBitCast(Fn, VoidPtrTy);
   1585 }
   1586 
   1587 namespace {
   1588 
   1589 /// Emits the copy/dispose helper functions for a __block object of id type.
   1590 class ObjectByrefHelpers : public CodeGenModule::ByrefHelpers {
   1591   BlockFieldFlags Flags;
   1592 
   1593 public:
   1594   ObjectByrefHelpers(CharUnits alignment, BlockFieldFlags flags)
   1595     : ByrefHelpers(alignment), Flags(flags) {}
   1596 
   1597   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
   1598                 llvm::Value *srcField) {
   1599     destField = CGF.Builder.CreateBitCast(destField, CGF.VoidPtrTy);
   1600 
   1601     srcField = CGF.Builder.CreateBitCast(srcField, CGF.VoidPtrPtrTy);
   1602     llvm::Value *srcValue = CGF.Builder.CreateLoad(srcField);
   1603 
   1604     unsigned flags = (Flags | BLOCK_BYREF_CALLER).getBitMask();
   1605 
   1606     llvm::Value *flagsVal = llvm::ConstantInt::get(CGF.Int32Ty, flags);
   1607     llvm::Value *fn = CGF.CGM.getBlockObjectAssign();
   1608 
   1609     llvm::Value *args[] = { destField, srcValue, flagsVal };
   1610     CGF.EmitNounwindRuntimeCall(fn, args);
   1611   }
   1612 
   1613   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
   1614     field = CGF.Builder.CreateBitCast(field, CGF.Int8PtrTy->getPointerTo(0));
   1615     llvm::Value *value = CGF.Builder.CreateLoad(field);
   1616 
   1617     CGF.BuildBlockRelease(value, Flags | BLOCK_BYREF_CALLER);
   1618   }
   1619 
   1620   void profileImpl(llvm::FoldingSetNodeID &id) const {
   1621     id.AddInteger(Flags.getBitMask());
   1622   }
   1623 };
   1624 
   1625 /// Emits the copy/dispose helpers for an ARC __block __weak variable.
   1626 class ARCWeakByrefHelpers : public CodeGenModule::ByrefHelpers {
   1627 public:
   1628   ARCWeakByrefHelpers(CharUnits alignment) : ByrefHelpers(alignment) {}
   1629 
   1630   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
   1631                 llvm::Value *srcField) {
   1632     CGF.EmitARCMoveWeak(destField, srcField);
   1633   }
   1634 
   1635   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
   1636     CGF.EmitARCDestroyWeak(field);
   1637   }
   1638 
   1639   void profileImpl(llvm::FoldingSetNodeID &id) const {
   1640     // 0 is distinguishable from all pointers and byref flags
   1641     id.AddInteger(0);
   1642   }
   1643 };
   1644 
   1645 /// Emits the copy/dispose helpers for an ARC __block __strong variable
   1646 /// that's not of block-pointer type.
   1647 class ARCStrongByrefHelpers : public CodeGenModule::ByrefHelpers {
   1648 public:
   1649   ARCStrongByrefHelpers(CharUnits alignment) : ByrefHelpers(alignment) {}
   1650 
   1651   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
   1652                 llvm::Value *srcField) {
   1653     // Do a "move" by copying the value and then zeroing out the old
   1654     // variable.
   1655 
   1656     llvm::LoadInst *value = CGF.Builder.CreateLoad(srcField);
   1657     value->setAlignment(Alignment.getQuantity());
   1658 
   1659     llvm::Value *null =
   1660       llvm::ConstantPointerNull::get(cast<llvm::PointerType>(value->getType()));
   1661 
   1662     if (CGF.CGM.getCodeGenOpts().OptimizationLevel == 0) {
   1663       llvm::StoreInst *store = CGF.Builder.CreateStore(null, destField);
   1664       store->setAlignment(Alignment.getQuantity());
   1665       CGF.EmitARCStoreStrongCall(destField, value, /*ignored*/ true);
   1666       CGF.EmitARCStoreStrongCall(srcField, null, /*ignored*/ true);
   1667       return;
   1668     }
   1669     llvm::StoreInst *store = CGF.Builder.CreateStore(value, destField);
   1670     store->setAlignment(Alignment.getQuantity());
   1671 
   1672     store = CGF.Builder.CreateStore(null, srcField);
   1673     store->setAlignment(Alignment.getQuantity());
   1674   }
   1675 
   1676   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
   1677     CGF.EmitARCDestroyStrong(field, ARCImpreciseLifetime);
   1678   }
   1679 
   1680   void profileImpl(llvm::FoldingSetNodeID &id) const {
   1681     // 1 is distinguishable from all pointers and byref flags
   1682     id.AddInteger(1);
   1683   }
   1684 };
   1685 
   1686 /// Emits the copy/dispose helpers for an ARC __block __strong
   1687 /// variable that's of block-pointer type.
   1688 class ARCStrongBlockByrefHelpers : public CodeGenModule::ByrefHelpers {
   1689 public:
   1690   ARCStrongBlockByrefHelpers(CharUnits alignment) : ByrefHelpers(alignment) {}
   1691 
   1692   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
   1693                 llvm::Value *srcField) {
   1694     // Do the copy with objc_retainBlock; that's all that
   1695     // _Block_object_assign would do anyway, and we'd have to pass the
   1696     // right arguments to make sure it doesn't get no-op'ed.
   1697     llvm::LoadInst *oldValue = CGF.Builder.CreateLoad(srcField);
   1698     oldValue->setAlignment(Alignment.getQuantity());
   1699 
   1700     llvm::Value *copy = CGF.EmitARCRetainBlock(oldValue, /*mandatory*/ true);
   1701 
   1702     llvm::StoreInst *store = CGF.Builder.CreateStore(copy, destField);
   1703     store->setAlignment(Alignment.getQuantity());
   1704   }
   1705 
   1706   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
   1707     CGF.EmitARCDestroyStrong(field, ARCImpreciseLifetime);
   1708   }
   1709 
   1710   void profileImpl(llvm::FoldingSetNodeID &id) const {
   1711     // 2 is distinguishable from all pointers and byref flags
   1712     id.AddInteger(2);
   1713   }
   1714 };
   1715 
   1716 /// Emits the copy/dispose helpers for a __block variable with a
   1717 /// nontrivial copy constructor or destructor.
   1718 class CXXByrefHelpers : public CodeGenModule::ByrefHelpers {
   1719   QualType VarType;
   1720   const Expr *CopyExpr;
   1721 
   1722 public:
   1723   CXXByrefHelpers(CharUnits alignment, QualType type,
   1724                   const Expr *copyExpr)
   1725     : ByrefHelpers(alignment), VarType(type), CopyExpr(copyExpr) {}
   1726 
   1727   bool needsCopy() const { return CopyExpr != 0; }
   1728   void emitCopy(CodeGenFunction &CGF, llvm::Value *destField,
   1729                 llvm::Value *srcField) {
   1730     if (!CopyExpr) return;
   1731     CGF.EmitSynthesizedCXXCopyCtor(destField, srcField, CopyExpr);
   1732   }
   1733 
   1734   void emitDispose(CodeGenFunction &CGF, llvm::Value *field) {
   1735     EHScopeStack::stable_iterator cleanupDepth = CGF.EHStack.stable_begin();
   1736     CGF.PushDestructorCleanup(VarType, field);
   1737     CGF.PopCleanupBlocks(cleanupDepth);
   1738   }
   1739 
   1740   void profileImpl(llvm::FoldingSetNodeID &id) const {
   1741     id.AddPointer(VarType.getCanonicalType().getAsOpaquePtr());
   1742   }
   1743 };
   1744 } // end anonymous namespace
   1745 
   1746 static llvm::Constant *
   1747 generateByrefCopyHelper(CodeGenFunction &CGF,
   1748                         llvm::StructType &byrefType,
   1749                         unsigned valueFieldIndex,
   1750                         CodeGenModule::ByrefHelpers &byrefInfo) {
   1751   ASTContext &Context = CGF.getContext();
   1752 
   1753   QualType R = Context.VoidTy;
   1754 
   1755   FunctionArgList args;
   1756   ImplicitParamDecl dst(0, SourceLocation(), 0, Context.VoidPtrTy);
   1757   args.push_back(&dst);
   1758 
   1759   ImplicitParamDecl src(0, SourceLocation(), 0, Context.VoidPtrTy);
   1760   args.push_back(&src);
   1761 
   1762   const CGFunctionInfo &FI =
   1763     CGF.CGM.getTypes().arrangeFunctionDeclaration(R, args,
   1764                                                   FunctionType::ExtInfo(),
   1765                                                   /*variadic*/ false);
   1766 
   1767   CodeGenTypes &Types = CGF.CGM.getTypes();
   1768   llvm::FunctionType *LTy = Types.GetFunctionType(FI);
   1769 
   1770   // FIXME: We'd like to put these into a mergable by content, with
   1771   // internal linkage.
   1772   llvm::Function *Fn =
   1773     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
   1774                            "__Block_byref_object_copy_", &CGF.CGM.getModule());
   1775 
   1776   IdentifierInfo *II
   1777     = &Context.Idents.get("__Block_byref_object_copy_");
   1778 
   1779   FunctionDecl *FD = FunctionDecl::Create(Context,
   1780                                           Context.getTranslationUnitDecl(),
   1781                                           SourceLocation(),
   1782                                           SourceLocation(), II, R, 0,
   1783                                           SC_Static,
   1784                                           false, false);
   1785 
   1786   // Initialize debug info if necessary.
   1787   CGF.maybeInitializeDebugInfo();
   1788   CGF.StartFunction(FD, R, Fn, FI, args, SourceLocation());
   1789 
   1790   if (byrefInfo.needsCopy()) {
   1791     llvm::Type *byrefPtrType = byrefType.getPointerTo(0);
   1792 
   1793     // dst->x
   1794     llvm::Value *destField = CGF.GetAddrOfLocalVar(&dst);
   1795     destField = CGF.Builder.CreateLoad(destField);
   1796     destField = CGF.Builder.CreateBitCast(destField, byrefPtrType);
   1797     destField = CGF.Builder.CreateStructGEP(destField, valueFieldIndex, "x");
   1798 
   1799     // src->x
   1800     llvm::Value *srcField = CGF.GetAddrOfLocalVar(&src);
   1801     srcField = CGF.Builder.CreateLoad(srcField);
   1802     srcField = CGF.Builder.CreateBitCast(srcField, byrefPtrType);
   1803     srcField = CGF.Builder.CreateStructGEP(srcField, valueFieldIndex, "x");
   1804 
   1805     byrefInfo.emitCopy(CGF, destField, srcField);
   1806   }
   1807 
   1808   CGF.FinishFunction();
   1809 
   1810   return llvm::ConstantExpr::getBitCast(Fn, CGF.Int8PtrTy);
   1811 }
   1812 
   1813 /// Build the copy helper for a __block variable.
   1814 static llvm::Constant *buildByrefCopyHelper(CodeGenModule &CGM,
   1815                                             llvm::StructType &byrefType,
   1816                                             unsigned byrefValueIndex,
   1817                                             CodeGenModule::ByrefHelpers &info) {
   1818   CodeGenFunction CGF(CGM);
   1819   return generateByrefCopyHelper(CGF, byrefType, byrefValueIndex, info);
   1820 }
   1821 
   1822 /// Generate code for a __block variable's dispose helper.
   1823 static llvm::Constant *
   1824 generateByrefDisposeHelper(CodeGenFunction &CGF,
   1825                            llvm::StructType &byrefType,
   1826                            unsigned byrefValueIndex,
   1827                            CodeGenModule::ByrefHelpers &byrefInfo) {
   1828   ASTContext &Context = CGF.getContext();
   1829   QualType R = Context.VoidTy;
   1830 
   1831   FunctionArgList args;
   1832   ImplicitParamDecl src(0, SourceLocation(), 0, Context.VoidPtrTy);
   1833   args.push_back(&src);
   1834 
   1835   const CGFunctionInfo &FI =
   1836     CGF.CGM.getTypes().arrangeFunctionDeclaration(R, args,
   1837                                                   FunctionType::ExtInfo(),
   1838                                                   /*variadic*/ false);
   1839 
   1840   CodeGenTypes &Types = CGF.CGM.getTypes();
   1841   llvm::FunctionType *LTy = Types.GetFunctionType(FI);
   1842 
   1843   // FIXME: We'd like to put these into a mergable by content, with
   1844   // internal linkage.
   1845   llvm::Function *Fn =
   1846     llvm::Function::Create(LTy, llvm::GlobalValue::InternalLinkage,
   1847                            "__Block_byref_object_dispose_",
   1848                            &CGF.CGM.getModule());
   1849 
   1850   IdentifierInfo *II
   1851     = &Context.Idents.get("__Block_byref_object_dispose_");
   1852 
   1853   FunctionDecl *FD = FunctionDecl::Create(Context,
   1854                                           Context.getTranslationUnitDecl(),
   1855                                           SourceLocation(),
   1856                                           SourceLocation(), II, R, 0,
   1857                                           SC_Static,
   1858                                           false, false);
   1859   // Initialize debug info if necessary.
   1860   CGF.maybeInitializeDebugInfo();
   1861   CGF.StartFunction(FD, R, Fn, FI, args, SourceLocation());
   1862 
   1863   if (byrefInfo.needsDispose()) {
   1864     llvm::Value *V = CGF.GetAddrOfLocalVar(&src);
   1865     V = CGF.Builder.CreateLoad(V);
   1866     V = CGF.Builder.CreateBitCast(V, byrefType.getPointerTo(0));
   1867     V = CGF.Builder.CreateStructGEP(V, byrefValueIndex, "x");
   1868 
   1869     byrefInfo.emitDispose(CGF, V);
   1870   }
   1871 
   1872   CGF.FinishFunction();
   1873 
   1874   return llvm::ConstantExpr::getBitCast(Fn, CGF.Int8PtrTy);
   1875 }
   1876 
   1877 /// Build the dispose helper for a __block variable.
   1878 static llvm::Constant *buildByrefDisposeHelper(CodeGenModule &CGM,
   1879                                               llvm::StructType &byrefType,
   1880                                                unsigned byrefValueIndex,
   1881                                             CodeGenModule::ByrefHelpers &info) {
   1882   CodeGenFunction CGF(CGM);
   1883   return generateByrefDisposeHelper(CGF, byrefType, byrefValueIndex, info);
   1884 }
   1885 
   1886 /// Lazily build the copy and dispose helpers for a __block variable
   1887 /// with the given information.
   1888 template <class T> static T *buildByrefHelpers(CodeGenModule &CGM,
   1889                                                llvm::StructType &byrefTy,
   1890                                                unsigned byrefValueIndex,
   1891                                                T &byrefInfo) {
   1892   // Increase the field's alignment to be at least pointer alignment,
   1893   // since the layout of the byref struct will guarantee at least that.
   1894   byrefInfo.Alignment = std::max(byrefInfo.Alignment,
   1895                               CharUnits::fromQuantity(CGM.PointerAlignInBytes));
   1896 
   1897   llvm::FoldingSetNodeID id;
   1898   byrefInfo.Profile(id);
   1899 
   1900   void *insertPos;
   1901   CodeGenModule::ByrefHelpers *node
   1902     = CGM.ByrefHelpersCache.FindNodeOrInsertPos(id, insertPos);
   1903   if (node) return static_cast<T*>(node);
   1904 
   1905   byrefInfo.CopyHelper =
   1906     buildByrefCopyHelper(CGM, byrefTy, byrefValueIndex, byrefInfo);
   1907   byrefInfo.DisposeHelper =
   1908     buildByrefDisposeHelper(CGM, byrefTy, byrefValueIndex,byrefInfo);
   1909 
   1910   T *copy = new (CGM.getContext()) T(byrefInfo);
   1911   CGM.ByrefHelpersCache.InsertNode(copy, insertPos);
   1912   return copy;
   1913 }
   1914 
   1915 /// Build the copy and dispose helpers for the given __block variable
   1916 /// emission.  Places the helpers in the global cache.  Returns null
   1917 /// if no helpers are required.
   1918 CodeGenModule::ByrefHelpers *
   1919 CodeGenFunction::buildByrefHelpers(llvm::StructType &byrefType,
   1920                                    const AutoVarEmission &emission) {
   1921   const VarDecl &var = *emission.Variable;
   1922   QualType type = var.getType();
   1923 
   1924   unsigned byrefValueIndex = getByRefValueLLVMField(&var);
   1925 
   1926   if (const CXXRecordDecl *record = type->getAsCXXRecordDecl()) {
   1927     const Expr *copyExpr = CGM.getContext().getBlockVarCopyInits(&var);
   1928     if (!copyExpr && record->hasTrivialDestructor()) return 0;
   1929 
   1930     CXXByrefHelpers byrefInfo(emission.Alignment, type, copyExpr);
   1931     return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
   1932   }
   1933 
   1934   // Otherwise, if we don't have a retainable type, there's nothing to do.
   1935   // that the runtime does extra copies.
   1936   if (!type->isObjCRetainableType()) return 0;
   1937 
   1938   Qualifiers qs = type.getQualifiers();
   1939 
   1940   // If we have lifetime, that dominates.
   1941   if (Qualifiers::ObjCLifetime lifetime = qs.getObjCLifetime()) {
   1942     assert(getLangOpts().ObjCAutoRefCount);
   1943 
   1944     switch (lifetime) {
   1945     case Qualifiers::OCL_None: llvm_unreachable("impossible");
   1946 
   1947     // These are just bits as far as the runtime is concerned.
   1948     case Qualifiers::OCL_ExplicitNone:
   1949     case Qualifiers::OCL_Autoreleasing:
   1950       return 0;
   1951 
   1952     // Tell the runtime that this is ARC __weak, called by the
   1953     // byref routines.
   1954     case Qualifiers::OCL_Weak: {
   1955       ARCWeakByrefHelpers byrefInfo(emission.Alignment);
   1956       return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
   1957     }
   1958 
   1959     // ARC __strong __block variables need to be retained.
   1960     case Qualifiers::OCL_Strong:
   1961       // Block pointers need to be copied, and there's no direct
   1962       // transfer possible.
   1963       if (type->isBlockPointerType()) {
   1964         ARCStrongBlockByrefHelpers byrefInfo(emission.Alignment);
   1965         return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
   1966 
   1967       // Otherwise, we transfer ownership of the retain from the stack
   1968       // to the heap.
   1969       } else {
   1970         ARCStrongByrefHelpers byrefInfo(emission.Alignment);
   1971         return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
   1972       }
   1973     }
   1974     llvm_unreachable("fell out of lifetime switch!");
   1975   }
   1976 
   1977   BlockFieldFlags flags;
   1978   if (type->isBlockPointerType()) {
   1979     flags |= BLOCK_FIELD_IS_BLOCK;
   1980   } else if (CGM.getContext().isObjCNSObjectType(type) ||
   1981              type->isObjCObjectPointerType()) {
   1982     flags |= BLOCK_FIELD_IS_OBJECT;
   1983   } else {
   1984     return 0;
   1985   }
   1986 
   1987   if (type.isObjCGCWeak())
   1988     flags |= BLOCK_FIELD_IS_WEAK;
   1989 
   1990   ObjectByrefHelpers byrefInfo(emission.Alignment, flags);
   1991   return ::buildByrefHelpers(CGM, byrefType, byrefValueIndex, byrefInfo);
   1992 }
   1993 
   1994 unsigned CodeGenFunction::getByRefValueLLVMField(const ValueDecl *VD) const {
   1995   assert(ByRefValueInfo.count(VD) && "Did not find value!");
   1996 
   1997   return ByRefValueInfo.find(VD)->second.second;
   1998 }
   1999 
   2000 llvm::Value *CodeGenFunction::BuildBlockByrefAddress(llvm::Value *BaseAddr,
   2001                                                      const VarDecl *V) {
   2002   llvm::Value *Loc = Builder.CreateStructGEP(BaseAddr, 1, "forwarding");
   2003   Loc = Builder.CreateLoad(Loc);
   2004   Loc = Builder.CreateStructGEP(Loc, getByRefValueLLVMField(V),
   2005                                 V->getNameAsString());
   2006   return Loc;
   2007 }
   2008 
   2009 /// BuildByRefType - This routine changes a __block variable declared as T x
   2010 ///   into:
   2011 ///
   2012 ///      struct {
   2013 ///        void *__isa;
   2014 ///        void *__forwarding;
   2015 ///        int32_t __flags;
   2016 ///        int32_t __size;
   2017 ///        void *__copy_helper;       // only if needed
   2018 ///        void *__destroy_helper;    // only if needed
   2019 ///        void *__byref_variable_layout;// only if needed
   2020 ///        char padding[X];           // only if needed
   2021 ///        T x;
   2022 ///      } x
   2023 ///
   2024 llvm::Type *CodeGenFunction::BuildByRefType(const VarDecl *D) {
   2025   std::pair<llvm::Type *, unsigned> &Info = ByRefValueInfo[D];
   2026   if (Info.first)
   2027     return Info.first;
   2028 
   2029   QualType Ty = D->getType();
   2030 
   2031   SmallVector<llvm::Type *, 8> types;
   2032 
   2033   llvm::StructType *ByRefType =
   2034     llvm::StructType::create(getLLVMContext(),
   2035                              "struct.__block_byref_" + D->getNameAsString());
   2036 
   2037   // void *__isa;
   2038   types.push_back(Int8PtrTy);
   2039 
   2040   // void *__forwarding;
   2041   types.push_back(llvm::PointerType::getUnqual(ByRefType));
   2042 
   2043   // int32_t __flags;
   2044   types.push_back(Int32Ty);
   2045 
   2046   // int32_t __size;
   2047   types.push_back(Int32Ty);
   2048   // Note that this must match *exactly* the logic in buildByrefHelpers.
   2049   bool HasCopyAndDispose = getContext().BlockRequiresCopying(Ty, D);
   2050   if (HasCopyAndDispose) {
   2051     /// void *__copy_helper;
   2052     types.push_back(Int8PtrTy);
   2053 
   2054     /// void *__destroy_helper;
   2055     types.push_back(Int8PtrTy);
   2056   }
   2057   bool HasByrefExtendedLayout = false;
   2058   Qualifiers::ObjCLifetime Lifetime;
   2059   if (getContext().getByrefLifetime(Ty, Lifetime, HasByrefExtendedLayout) &&
   2060       HasByrefExtendedLayout)
   2061     /// void *__byref_variable_layout;
   2062     types.push_back(Int8PtrTy);
   2063 
   2064   bool Packed = false;
   2065   CharUnits Align = getContext().getDeclAlign(D);
   2066   if (Align >
   2067       getContext().toCharUnitsFromBits(getTarget().getPointerAlign(0))) {
   2068     // We have to insert padding.
   2069 
   2070     // The struct above has 2 32-bit integers.
   2071     unsigned CurrentOffsetInBytes = 4 * 2;
   2072 
   2073     // And either 2, 3, 4 or 5 pointers.
   2074     unsigned noPointers = 2;
   2075     if (HasCopyAndDispose)
   2076       noPointers += 2;
   2077     if (HasByrefExtendedLayout)
   2078       noPointers += 1;
   2079 
   2080     CurrentOffsetInBytes += noPointers * CGM.getDataLayout().getTypeAllocSize(Int8PtrTy);
   2081 
   2082     // Align the offset.
   2083     unsigned AlignedOffsetInBytes =
   2084       llvm::RoundUpToAlignment(CurrentOffsetInBytes, Align.getQuantity());
   2085 
   2086     unsigned NumPaddingBytes = AlignedOffsetInBytes - CurrentOffsetInBytes;
   2087     if (NumPaddingBytes > 0) {
   2088       llvm::Type *Ty = Int8Ty;
   2089       // FIXME: We need a sema error for alignment larger than the minimum of
   2090       // the maximal stack alignment and the alignment of malloc on the system.
   2091       if (NumPaddingBytes > 1)
   2092         Ty = llvm::ArrayType::get(Ty, NumPaddingBytes);
   2093 
   2094       types.push_back(Ty);
   2095 
   2096       // We want a packed struct.
   2097       Packed = true;
   2098     }
   2099   }
   2100 
   2101   // T x;
   2102   types.push_back(ConvertTypeForMem(Ty));
   2103 
   2104   ByRefType->setBody(types, Packed);
   2105 
   2106   Info.first = ByRefType;
   2107 
   2108   Info.second = types.size() - 1;
   2109 
   2110   return Info.first;
   2111 }
   2112 
   2113 /// Initialize the structural components of a __block variable, i.e.
   2114 /// everything but the actual object.
   2115 void CodeGenFunction::emitByrefStructureInit(const AutoVarEmission &emission) {
   2116   // Find the address of the local.
   2117   llvm::Value *addr = emission.Address;
   2118 
   2119   // That's an alloca of the byref structure type.
   2120   llvm::StructType *byrefType = cast<llvm::StructType>(
   2121                  cast<llvm::PointerType>(addr->getType())->getElementType());
   2122 
   2123   // Build the byref helpers if necessary.  This is null if we don't need any.
   2124   CodeGenModule::ByrefHelpers *helpers =
   2125     buildByrefHelpers(*byrefType, emission);
   2126 
   2127   const VarDecl &D = *emission.Variable;
   2128   QualType type = D.getType();
   2129 
   2130   bool HasByrefExtendedLayout;
   2131   Qualifiers::ObjCLifetime ByrefLifetime;
   2132   bool ByRefHasLifetime =
   2133     getContext().getByrefLifetime(type, ByrefLifetime, HasByrefExtendedLayout);
   2134 
   2135   llvm::Value *V;
   2136 
   2137   // Initialize the 'isa', which is just 0 or 1.
   2138   int isa = 0;
   2139   if (type.isObjCGCWeak())
   2140     isa = 1;
   2141   V = Builder.CreateIntToPtr(Builder.getInt32(isa), Int8PtrTy, "isa");
   2142   Builder.CreateStore(V, Builder.CreateStructGEP(addr, 0, "byref.isa"));
   2143 
   2144   // Store the address of the variable into its own forwarding pointer.
   2145   Builder.CreateStore(addr,
   2146                       Builder.CreateStructGEP(addr, 1, "byref.forwarding"));
   2147 
   2148   // Blocks ABI:
   2149   //   c) the flags field is set to either 0 if no helper functions are
   2150   //      needed or BLOCK_BYREF_HAS_COPY_DISPOSE if they are,
   2151   BlockFlags flags;
   2152   if (helpers) flags |= BLOCK_BYREF_HAS_COPY_DISPOSE;
   2153   if (ByRefHasLifetime) {
   2154     if (HasByrefExtendedLayout) flags |= BLOCK_BYREF_LAYOUT_EXTENDED;
   2155       else switch (ByrefLifetime) {
   2156         case Qualifiers::OCL_Strong:
   2157           flags |= BLOCK_BYREF_LAYOUT_STRONG;
   2158           break;
   2159         case Qualifiers::OCL_Weak:
   2160           flags |= BLOCK_BYREF_LAYOUT_WEAK;
   2161           break;
   2162         case Qualifiers::OCL_ExplicitNone:
   2163           flags |= BLOCK_BYREF_LAYOUT_UNRETAINED;
   2164           break;
   2165         case Qualifiers::OCL_None:
   2166           if (!type->isObjCObjectPointerType() && !type->isBlockPointerType())
   2167             flags |= BLOCK_BYREF_LAYOUT_NON_OBJECT;
   2168           break;
   2169         default:
   2170           break;
   2171       }
   2172     if (CGM.getLangOpts().ObjCGCBitmapPrint) {
   2173       printf("\n Inline flag for BYREF variable layout (%d):", flags.getBitMask());
   2174       if (flags & BLOCK_BYREF_HAS_COPY_DISPOSE)
   2175         printf(" BLOCK_BYREF_HAS_COPY_DISPOSE");
   2176       if (flags & BLOCK_BYREF_LAYOUT_MASK) {
   2177         BlockFlags ThisFlag(flags.getBitMask() & BLOCK_BYREF_LAYOUT_MASK);
   2178         if (ThisFlag ==  BLOCK_BYREF_LAYOUT_EXTENDED)
   2179           printf(" BLOCK_BYREF_LAYOUT_EXTENDED");
   2180         if (ThisFlag ==  BLOCK_BYREF_LAYOUT_STRONG)
   2181           printf(" BLOCK_BYREF_LAYOUT_STRONG");
   2182         if (ThisFlag == BLOCK_BYREF_LAYOUT_WEAK)
   2183           printf(" BLOCK_BYREF_LAYOUT_WEAK");
   2184         if (ThisFlag == BLOCK_BYREF_LAYOUT_UNRETAINED)
   2185           printf(" BLOCK_BYREF_LAYOUT_UNRETAINED");
   2186         if (ThisFlag == BLOCK_BYREF_LAYOUT_NON_OBJECT)
   2187           printf(" BLOCK_BYREF_LAYOUT_NON_OBJECT");
   2188       }
   2189       printf("\n");
   2190     }
   2191   }
   2192 
   2193   Builder.CreateStore(llvm::ConstantInt::get(IntTy, flags.getBitMask()),
   2194                       Builder.CreateStructGEP(addr, 2, "byref.flags"));
   2195 
   2196   CharUnits byrefSize = CGM.GetTargetTypeStoreSize(byrefType);
   2197   V = llvm::ConstantInt::get(IntTy, byrefSize.getQuantity());
   2198   Builder.CreateStore(V, Builder.CreateStructGEP(addr, 3, "byref.size"));
   2199 
   2200   if (helpers) {
   2201     llvm::Value *copy_helper = Builder.CreateStructGEP(addr, 4);
   2202     Builder.CreateStore(helpers->CopyHelper, copy_helper);
   2203 
   2204     llvm::Value *destroy_helper = Builder.CreateStructGEP(addr, 5);
   2205     Builder.CreateStore(helpers->DisposeHelper, destroy_helper);
   2206   }
   2207   if (ByRefHasLifetime && HasByrefExtendedLayout) {
   2208     llvm::Constant* ByrefLayoutInfo = CGM.getObjCRuntime().BuildByrefLayout(CGM, type);
   2209     llvm::Value *ByrefInfoAddr = Builder.CreateStructGEP(addr, helpers ? 6 : 4,
   2210                                                          "byref.layout");
   2211     // cast destination to pointer to source type.
   2212     llvm::Type *DesTy = ByrefLayoutInfo->getType();
   2213     DesTy = DesTy->getPointerTo();
   2214     llvm::Value *BC = Builder.CreatePointerCast(ByrefInfoAddr, DesTy);
   2215     Builder.CreateStore(ByrefLayoutInfo, BC);
   2216   }
   2217 }
   2218 
   2219 void CodeGenFunction::BuildBlockRelease(llvm::Value *V, BlockFieldFlags flags) {
   2220   llvm::Value *F = CGM.getBlockObjectDispose();
   2221   llvm::Value *args[] = {
   2222     Builder.CreateBitCast(V, Int8PtrTy),
   2223     llvm::ConstantInt::get(Int32Ty, flags.getBitMask())
   2224   };
   2225   EmitNounwindRuntimeCall(F, args); // FIXME: throwing destructors?
   2226 }
   2227 
   2228 namespace {
   2229   struct CallBlockRelease : EHScopeStack::Cleanup {
   2230     llvm::Value *Addr;
   2231     CallBlockRelease(llvm::Value *Addr) : Addr(Addr) {}
   2232 
   2233     void Emit(CodeGenFunction &CGF, Flags flags) {
   2234       // Should we be passing FIELD_IS_WEAK here?
   2235       CGF.BuildBlockRelease(Addr, BLOCK_FIELD_IS_BYREF);
   2236     }
   2237   };
   2238 }
   2239 
   2240 /// Enter a cleanup to destroy a __block variable.  Note that this
   2241 /// cleanup should be a no-op if the variable hasn't left the stack
   2242 /// yet; if a cleanup is required for the variable itself, that needs
   2243 /// to be done externally.
   2244 void CodeGenFunction::enterByrefCleanup(const AutoVarEmission &emission) {
   2245   // We don't enter this cleanup if we're in pure-GC mode.
   2246   if (CGM.getLangOpts().getGC() == LangOptions::GCOnly)
   2247     return;
   2248 
   2249   EHStack.pushCleanup<CallBlockRelease>(NormalAndEHCleanup, emission.Address);
   2250 }
   2251 
   2252 /// Adjust the declaration of something from the blocks API.
   2253 static void configureBlocksRuntimeObject(CodeGenModule &CGM,
   2254                                          llvm::Constant *C) {
   2255   if (!CGM.getLangOpts().BlocksRuntimeOptional) return;
   2256 
   2257   llvm::GlobalValue *GV = cast<llvm::GlobalValue>(C->stripPointerCasts());
   2258   if (GV->isDeclaration() &&
   2259       GV->getLinkage() == llvm::GlobalValue::ExternalLinkage)
   2260     GV->setLinkage(llvm::GlobalValue::ExternalWeakLinkage);
   2261 }
   2262 
   2263 llvm::Constant *CodeGenModule::getBlockObjectDispose() {
   2264   if (BlockObjectDispose)
   2265     return BlockObjectDispose;
   2266 
   2267   llvm::Type *args[] = { Int8PtrTy, Int32Ty };
   2268   llvm::FunctionType *fty
   2269     = llvm::FunctionType::get(VoidTy, args, false);
   2270   BlockObjectDispose = CreateRuntimeFunction(fty, "_Block_object_dispose");
   2271   configureBlocksRuntimeObject(*this, BlockObjectDispose);
   2272   return BlockObjectDispose;
   2273 }
   2274 
   2275 llvm::Constant *CodeGenModule::getBlockObjectAssign() {
   2276   if (BlockObjectAssign)
   2277     return BlockObjectAssign;
   2278 
   2279   llvm::Type *args[] = { Int8PtrTy, Int8PtrTy, Int32Ty };
   2280   llvm::FunctionType *fty
   2281     = llvm::FunctionType::get(VoidTy, args, false);
   2282   BlockObjectAssign = CreateRuntimeFunction(fty, "_Block_object_assign");
   2283   configureBlocksRuntimeObject(*this, BlockObjectAssign);
   2284   return BlockObjectAssign;
   2285 }
   2286 
   2287 llvm::Constant *CodeGenModule::getNSConcreteGlobalBlock() {
   2288   if (NSConcreteGlobalBlock)
   2289     return NSConcreteGlobalBlock;
   2290 
   2291   NSConcreteGlobalBlock = GetOrCreateLLVMGlobal("_NSConcreteGlobalBlock",
   2292                                                 Int8PtrTy->getPointerTo(), 0);
   2293   configureBlocksRuntimeObject(*this, NSConcreteGlobalBlock);
   2294   return NSConcreteGlobalBlock;
   2295 }
   2296 
   2297 llvm::Constant *CodeGenModule::getNSConcreteStackBlock() {
   2298   if (NSConcreteStackBlock)
   2299     return NSConcreteStackBlock;
   2300 
   2301   NSConcreteStackBlock = GetOrCreateLLVMGlobal("_NSConcreteStackBlock",
   2302                                                Int8PtrTy->getPointerTo(), 0);
   2303   configureBlocksRuntimeObject(*this, NSConcreteStackBlock);
   2304   return NSConcreteStackBlock;
   2305 }
   2306