Home | History | Annotate | Download | only in Object
      1 //===- ArchiveWriter.cpp - ar File Format implementation --------*- C++ -*-===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This file defines the writeArchive function.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 #include "llvm/Object/ArchiveWriter.h"
     15 #include "llvm/ADT/ArrayRef.h"
     16 #include "llvm/ADT/StringRef.h"
     17 #include "llvm/IR/LLVMContext.h"
     18 #include "llvm/Object/Archive.h"
     19 #include "llvm/Object/ObjectFile.h"
     20 #include "llvm/Object/SymbolicFile.h"
     21 #include "llvm/Support/EndianStream.h"
     22 #include "llvm/Support/Errc.h"
     23 #include "llvm/Support/ErrorHandling.h"
     24 #include "llvm/Support/Format.h"
     25 #include "llvm/Support/Path.h"
     26 #include "llvm/Support/ToolOutputFile.h"
     27 #include "llvm/Support/raw_ostream.h"
     28 
     29 #if !defined(_MSC_VER) && !defined(__MINGW32__)
     30 #include <unistd.h>
     31 #else
     32 #include <io.h>
     33 #endif
     34 
     35 using namespace llvm;
     36 
     37 NewArchiveMember::NewArchiveMember(MemoryBufferRef BufRef)
     38     : Buf(MemoryBuffer::getMemBuffer(BufRef, false)) {}
     39 
     40 Expected<NewArchiveMember>
     41 NewArchiveMember::getOldMember(const object::Archive::Child &OldMember,
     42                                bool Deterministic) {
     43   ErrorOr<llvm::MemoryBufferRef> BufOrErr = OldMember.getMemoryBufferRef();
     44   if (!BufOrErr)
     45     return errorCodeToError(BufOrErr.getError());
     46 
     47   NewArchiveMember M;
     48   M.Buf = MemoryBuffer::getMemBuffer(*BufOrErr, false);
     49   if (!Deterministic) {
     50     M.ModTime = OldMember.getLastModified();
     51     M.UID = OldMember.getUID();
     52     M.GID = OldMember.getGID();
     53     M.Perms = OldMember.getAccessMode();
     54   }
     55   return std::move(M);
     56 }
     57 
     58 Expected<NewArchiveMember> NewArchiveMember::getFile(StringRef FileName,
     59                                                      bool Deterministic) {
     60   sys::fs::file_status Status;
     61   int FD;
     62   if (auto EC = sys::fs::openFileForRead(FileName, FD))
     63     return errorCodeToError(EC);
     64   assert(FD != -1);
     65 
     66   if (auto EC = sys::fs::status(FD, Status))
     67     return errorCodeToError(EC);
     68 
     69   // Opening a directory doesn't make sense. Let it fail.
     70   // Linux cannot open directories with open(2), although
     71   // cygwin and *bsd can.
     72   if (Status.type() == sys::fs::file_type::directory_file)
     73     return errorCodeToError(make_error_code(errc::is_a_directory));
     74 
     75   ErrorOr<std::unique_ptr<MemoryBuffer>> MemberBufferOrErr =
     76       MemoryBuffer::getOpenFile(FD, FileName, Status.getSize(), false);
     77   if (!MemberBufferOrErr)
     78     return errorCodeToError(MemberBufferOrErr.getError());
     79 
     80   if (close(FD) != 0)
     81     return errorCodeToError(std::error_code(errno, std::generic_category()));
     82 
     83   NewArchiveMember M;
     84   M.Buf = std::move(*MemberBufferOrErr);
     85   if (!Deterministic) {
     86     M.ModTime = Status.getLastModificationTime();
     87     M.UID = Status.getUser();
     88     M.GID = Status.getGroup();
     89     M.Perms = Status.permissions();
     90   }
     91   return std::move(M);
     92 }
     93 
     94 template <typename T>
     95 static void printWithSpacePadding(raw_fd_ostream &OS, T Data, unsigned Size,
     96                                   bool MayTruncate = false) {
     97   uint64_t OldPos = OS.tell();
     98   OS << Data;
     99   unsigned SizeSoFar = OS.tell() - OldPos;
    100   if (Size > SizeSoFar) {
    101     OS.indent(Size - SizeSoFar);
    102   } else if (Size < SizeSoFar) {
    103     assert(MayTruncate && "Data doesn't fit in Size");
    104     // Some of the data this is used for (like UID) can be larger than the
    105     // space available in the archive format. Truncate in that case.
    106     OS.seek(OldPos + Size);
    107   }
    108 }
    109 
    110 static void print32(raw_ostream &Out, object::Archive::Kind Kind,
    111                     uint32_t Val) {
    112   if (Kind == object::Archive::K_GNU)
    113     support::endian::Writer<support::big>(Out).write(Val);
    114   else
    115     support::endian::Writer<support::little>(Out).write(Val);
    116 }
    117 
    118 static void printRestOfMemberHeader(raw_fd_ostream &Out,
    119                                     const sys::TimeValue &ModTime, unsigned UID,
    120                                     unsigned GID, unsigned Perms,
    121                                     unsigned Size) {
    122   printWithSpacePadding(Out, ModTime.toEpochTime(), 12);
    123   printWithSpacePadding(Out, UID, 6, true);
    124   printWithSpacePadding(Out, GID, 6, true);
    125   printWithSpacePadding(Out, format("%o", Perms), 8);
    126   printWithSpacePadding(Out, Size, 10);
    127   Out << "`\n";
    128 }
    129 
    130 static void printGNUSmallMemberHeader(raw_fd_ostream &Out, StringRef Name,
    131                                       const sys::TimeValue &ModTime,
    132                                       unsigned UID, unsigned GID,
    133                                       unsigned Perms, unsigned Size) {
    134   printWithSpacePadding(Out, Twine(Name) + "/", 16);
    135   printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, Size);
    136 }
    137 
    138 static void printBSDMemberHeader(raw_fd_ostream &Out, StringRef Name,
    139                                  const sys::TimeValue &ModTime, unsigned UID,
    140                                  unsigned GID, unsigned Perms, unsigned Size) {
    141   uint64_t PosAfterHeader = Out.tell() + 60 + Name.size();
    142   // Pad so that even 64 bit object files are aligned.
    143   unsigned Pad = OffsetToAlignment(PosAfterHeader, 8);
    144   unsigned NameWithPadding = Name.size() + Pad;
    145   printWithSpacePadding(Out, Twine("#1/") + Twine(NameWithPadding), 16);
    146   printRestOfMemberHeader(Out, ModTime, UID, GID, Perms,
    147                           NameWithPadding + Size);
    148   Out << Name;
    149   assert(PosAfterHeader == Out.tell());
    150   while (Pad--)
    151     Out.write(uint8_t(0));
    152 }
    153 
    154 static bool useStringTable(bool Thin, StringRef Name) {
    155   return Thin || Name.size() >= 16;
    156 }
    157 
    158 static void
    159 printMemberHeader(raw_fd_ostream &Out, object::Archive::Kind Kind, bool Thin,
    160                   StringRef Name,
    161                   std::vector<unsigned>::iterator &StringMapIndexIter,
    162                   const sys::TimeValue &ModTime, unsigned UID, unsigned GID,
    163                   unsigned Perms, unsigned Size) {
    164   if (Kind == object::Archive::K_BSD)
    165     return printBSDMemberHeader(Out, Name, ModTime, UID, GID, Perms, Size);
    166   if (!useStringTable(Thin, Name))
    167     return printGNUSmallMemberHeader(Out, Name, ModTime, UID, GID, Perms, Size);
    168   Out << '/';
    169   printWithSpacePadding(Out, *StringMapIndexIter++, 15);
    170   printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, Size);
    171 }
    172 
    173 // Compute the relative path from From to To.
    174 static std::string computeRelativePath(StringRef From, StringRef To) {
    175   if (sys::path::is_absolute(From) || sys::path::is_absolute(To))
    176     return To;
    177 
    178   StringRef DirFrom = sys::path::parent_path(From);
    179   auto FromI = sys::path::begin(DirFrom);
    180   auto ToI = sys::path::begin(To);
    181   while (*FromI == *ToI) {
    182     ++FromI;
    183     ++ToI;
    184   }
    185 
    186   SmallString<128> Relative;
    187   for (auto FromE = sys::path::end(DirFrom); FromI != FromE; ++FromI)
    188     sys::path::append(Relative, "..");
    189 
    190   for (auto ToE = sys::path::end(To); ToI != ToE; ++ToI)
    191     sys::path::append(Relative, *ToI);
    192 
    193   return Relative.str();
    194 }
    195 
    196 static void writeStringTable(raw_fd_ostream &Out, StringRef ArcName,
    197                              ArrayRef<NewArchiveMember> Members,
    198                              std::vector<unsigned> &StringMapIndexes,
    199                              bool Thin) {
    200   unsigned StartOffset = 0;
    201   for (const NewArchiveMember &M : Members) {
    202     StringRef Path = M.Buf->getBufferIdentifier();
    203     StringRef Name = sys::path::filename(Path);
    204     if (!useStringTable(Thin, Name))
    205       continue;
    206     if (StartOffset == 0) {
    207       printWithSpacePadding(Out, "//", 58);
    208       Out << "`\n";
    209       StartOffset = Out.tell();
    210     }
    211     StringMapIndexes.push_back(Out.tell() - StartOffset);
    212 
    213     if (Thin)
    214       Out << computeRelativePath(ArcName, Path);
    215     else
    216       Out << Name;
    217 
    218     Out << "/\n";
    219   }
    220   if (StartOffset == 0)
    221     return;
    222   if (Out.tell() % 2)
    223     Out << '\n';
    224   int Pos = Out.tell();
    225   Out.seek(StartOffset - 12);
    226   printWithSpacePadding(Out, Pos - StartOffset, 10);
    227   Out.seek(Pos);
    228 }
    229 
    230 static sys::TimeValue now(bool Deterministic) {
    231   if (!Deterministic)
    232     return sys::TimeValue::now();
    233   sys::TimeValue TV;
    234   TV.fromEpochTime(0);
    235   return TV;
    236 }
    237 
    238 // Returns the offset of the first reference to a member offset.
    239 static ErrorOr<unsigned>
    240 writeSymbolTable(raw_fd_ostream &Out, object::Archive::Kind Kind,
    241                  ArrayRef<NewArchiveMember> Members,
    242                  std::vector<unsigned> &MemberOffsetRefs, bool Deterministic) {
    243   unsigned HeaderStartOffset = 0;
    244   unsigned BodyStartOffset = 0;
    245   SmallString<128> NameBuf;
    246   raw_svector_ostream NameOS(NameBuf);
    247   LLVMContext Context;
    248   for (unsigned MemberNum = 0, N = Members.size(); MemberNum < N; ++MemberNum) {
    249     MemoryBufferRef MemberBuffer = Members[MemberNum].Buf->getMemBufferRef();
    250     Expected<std::unique_ptr<object::SymbolicFile>> ObjOrErr =
    251         object::SymbolicFile::createSymbolicFile(
    252             MemberBuffer, sys::fs::file_magic::unknown, &Context);
    253     if (!ObjOrErr) {
    254       // FIXME: check only for "not an object file" errors.
    255       consumeError(ObjOrErr.takeError());
    256       continue;
    257     }
    258     object::SymbolicFile &Obj = *ObjOrErr.get();
    259 
    260     if (!HeaderStartOffset) {
    261       HeaderStartOffset = Out.tell();
    262       if (Kind == object::Archive::K_GNU)
    263         printGNUSmallMemberHeader(Out, "", now(Deterministic), 0, 0, 0, 0);
    264       else
    265         printBSDMemberHeader(Out, "__.SYMDEF", now(Deterministic), 0, 0, 0, 0);
    266       BodyStartOffset = Out.tell();
    267       print32(Out, Kind, 0); // number of entries or bytes
    268     }
    269 
    270     for (const object::BasicSymbolRef &S : Obj.symbols()) {
    271       uint32_t Symflags = S.getFlags();
    272       if (Symflags & object::SymbolRef::SF_FormatSpecific)
    273         continue;
    274       if (!(Symflags & object::SymbolRef::SF_Global))
    275         continue;
    276       if (Symflags & object::SymbolRef::SF_Undefined)
    277         continue;
    278 
    279       unsigned NameOffset = NameOS.tell();
    280       if (auto EC = S.printName(NameOS))
    281         return EC;
    282       NameOS << '\0';
    283       MemberOffsetRefs.push_back(MemberNum);
    284       if (Kind == object::Archive::K_BSD)
    285         print32(Out, Kind, NameOffset);
    286       print32(Out, Kind, 0); // member offset
    287     }
    288   }
    289 
    290   if (HeaderStartOffset == 0)
    291     return 0;
    292 
    293   StringRef StringTable = NameOS.str();
    294   if (Kind == object::Archive::K_BSD)
    295     print32(Out, Kind, StringTable.size()); // byte count of the string table
    296   Out << StringTable;
    297 
    298   // ld64 requires the next member header to start at an offset that is
    299   // 4 bytes aligned.
    300   unsigned Pad = OffsetToAlignment(Out.tell(), 4);
    301   while (Pad--)
    302     Out.write(uint8_t(0));
    303 
    304   // Patch up the size of the symbol table now that we know how big it is.
    305   unsigned Pos = Out.tell();
    306   const unsigned MemberHeaderSize = 60;
    307   Out.seek(HeaderStartOffset + 48); // offset of the size field.
    308   printWithSpacePadding(Out, Pos - MemberHeaderSize - HeaderStartOffset, 10);
    309 
    310   // Patch up the number of symbols.
    311   Out.seek(BodyStartOffset);
    312   unsigned NumSyms = MemberOffsetRefs.size();
    313   if (Kind == object::Archive::K_GNU)
    314     print32(Out, Kind, NumSyms);
    315   else
    316     print32(Out, Kind, NumSyms * 8);
    317 
    318   Out.seek(Pos);
    319   return BodyStartOffset + 4;
    320 }
    321 
    322 std::pair<StringRef, std::error_code>
    323 llvm::writeArchive(StringRef ArcName,
    324                    std::vector<NewArchiveMember> &NewMembers,
    325                    bool WriteSymtab, object::Archive::Kind Kind,
    326                    bool Deterministic, bool Thin,
    327                    std::unique_ptr<MemoryBuffer> OldArchiveBuf) {
    328   assert((!Thin || Kind == object::Archive::K_GNU) &&
    329          "Only the gnu format has a thin mode");
    330   SmallString<128> TmpArchive;
    331   int TmpArchiveFD;
    332   if (auto EC = sys::fs::createUniqueFile(ArcName + ".temp-archive-%%%%%%%.a",
    333                                           TmpArchiveFD, TmpArchive))
    334     return std::make_pair(ArcName, EC);
    335 
    336   tool_output_file Output(TmpArchive, TmpArchiveFD);
    337   raw_fd_ostream &Out = Output.os();
    338   if (Thin)
    339     Out << "!<thin>\n";
    340   else
    341     Out << "!<arch>\n";
    342 
    343   std::vector<unsigned> MemberOffsetRefs;
    344 
    345   std::vector<std::unique_ptr<MemoryBuffer>> Buffers;
    346   std::vector<MemoryBufferRef> Members;
    347   std::vector<sys::fs::file_status> NewMemberStatus;
    348 
    349   unsigned MemberReferenceOffset = 0;
    350   if (WriteSymtab) {
    351     ErrorOr<unsigned> MemberReferenceOffsetOrErr = writeSymbolTable(
    352         Out, Kind, NewMembers, MemberOffsetRefs, Deterministic);
    353     if (auto EC = MemberReferenceOffsetOrErr.getError())
    354       return std::make_pair(ArcName, EC);
    355     MemberReferenceOffset = MemberReferenceOffsetOrErr.get();
    356   }
    357 
    358   std::vector<unsigned> StringMapIndexes;
    359   if (Kind != object::Archive::K_BSD)
    360     writeStringTable(Out, ArcName, NewMembers, StringMapIndexes, Thin);
    361 
    362   std::vector<unsigned>::iterator StringMapIndexIter = StringMapIndexes.begin();
    363   std::vector<unsigned> MemberOffset;
    364   for (const NewArchiveMember &M : NewMembers) {
    365     MemoryBufferRef File = M.Buf->getMemBufferRef();
    366 
    367     unsigned Pos = Out.tell();
    368     MemberOffset.push_back(Pos);
    369 
    370     printMemberHeader(Out, Kind, Thin,
    371                       sys::path::filename(M.Buf->getBufferIdentifier()),
    372                       StringMapIndexIter, M.ModTime, M.UID, M.GID, M.Perms,
    373                       M.Buf->getBufferSize());
    374 
    375     if (!Thin)
    376       Out << File.getBuffer();
    377 
    378     if (Out.tell() % 2)
    379       Out << '\n';
    380   }
    381 
    382   if (MemberReferenceOffset) {
    383     Out.seek(MemberReferenceOffset);
    384     for (unsigned MemberNum : MemberOffsetRefs) {
    385       if (Kind == object::Archive::K_BSD)
    386         Out.seek(Out.tell() + 4); // skip over the string offset
    387       print32(Out, Kind, MemberOffset[MemberNum]);
    388     }
    389   }
    390 
    391   Output.keep();
    392   Out.close();
    393 
    394   // At this point, we no longer need whatever backing memory
    395   // was used to generate the NewMembers. On Windows, this buffer
    396   // could be a mapped view of the file we want to replace (if
    397   // we're updating an existing archive, say). In that case, the
    398   // rename would still succeed, but it would leave behind a
    399   // temporary file (actually the original file renamed) because
    400   // a file cannot be deleted while there's a handle open on it,
    401   // only renamed. So by freeing this buffer, this ensures that
    402   // the last open handle on the destination file, if any, is
    403   // closed before we attempt to rename.
    404   OldArchiveBuf.reset();
    405 
    406   sys::fs::rename(TmpArchive, ArcName);
    407   return std::make_pair("", std::error_code());
    408 }
    409