1 //===- ArchiveWriter.cpp - ar File Format implementation --------*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file defines the writeArchive function. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "llvm/Object/ArchiveWriter.h" 15 #include "llvm/ADT/ArrayRef.h" 16 #include "llvm/ADT/StringRef.h" 17 #include "llvm/IR/LLVMContext.h" 18 #include "llvm/Object/Archive.h" 19 #include "llvm/Object/ObjectFile.h" 20 #include "llvm/Object/SymbolicFile.h" 21 #include "llvm/Support/EndianStream.h" 22 #include "llvm/Support/Errc.h" 23 #include "llvm/Support/ErrorHandling.h" 24 #include "llvm/Support/Format.h" 25 #include "llvm/Support/Path.h" 26 #include "llvm/Support/ToolOutputFile.h" 27 #include "llvm/Support/raw_ostream.h" 28 29 #if !defined(_MSC_VER) && !defined(__MINGW32__) 30 #include <unistd.h> 31 #else 32 #include <io.h> 33 #endif 34 35 using namespace llvm; 36 37 NewArchiveMember::NewArchiveMember(MemoryBufferRef BufRef) 38 : Buf(MemoryBuffer::getMemBuffer(BufRef, false)) {} 39 40 Expected<NewArchiveMember> 41 NewArchiveMember::getOldMember(const object::Archive::Child &OldMember, 42 bool Deterministic) { 43 Expected<llvm::MemoryBufferRef> BufOrErr = OldMember.getMemoryBufferRef(); 44 if (!BufOrErr) 45 return BufOrErr.takeError(); 46 47 NewArchiveMember M; 48 M.Buf = MemoryBuffer::getMemBuffer(*BufOrErr, false); 49 if (!Deterministic) { 50 auto ModTimeOrErr = OldMember.getLastModified(); 51 if (!ModTimeOrErr) 52 return ModTimeOrErr.takeError(); 53 M.ModTime = ModTimeOrErr.get(); 54 Expected<unsigned> UIDOrErr = OldMember.getUID(); 55 if (!UIDOrErr) 56 return UIDOrErr.takeError(); 57 M.UID = UIDOrErr.get(); 58 Expected<unsigned> GIDOrErr = OldMember.getGID(); 59 if (!GIDOrErr) 60 return GIDOrErr.takeError(); 61 M.GID = GIDOrErr.get(); 62 Expected<sys::fs::perms> AccessModeOrErr = OldMember.getAccessMode(); 63 if (!AccessModeOrErr) 64 return AccessModeOrErr.takeError(); 65 M.Perms = AccessModeOrErr.get(); 66 } 67 return std::move(M); 68 } 69 70 Expected<NewArchiveMember> NewArchiveMember::getFile(StringRef FileName, 71 bool Deterministic) { 72 sys::fs::file_status Status; 73 int FD; 74 if (auto EC = sys::fs::openFileForRead(FileName, FD)) 75 return errorCodeToError(EC); 76 assert(FD != -1); 77 78 if (auto EC = sys::fs::status(FD, Status)) 79 return errorCodeToError(EC); 80 81 // Opening a directory doesn't make sense. Let it fail. 82 // Linux cannot open directories with open(2), although 83 // cygwin and *bsd can. 84 if (Status.type() == sys::fs::file_type::directory_file) 85 return errorCodeToError(make_error_code(errc::is_a_directory)); 86 87 ErrorOr<std::unique_ptr<MemoryBuffer>> MemberBufferOrErr = 88 MemoryBuffer::getOpenFile(FD, FileName, Status.getSize(), false); 89 if (!MemberBufferOrErr) 90 return errorCodeToError(MemberBufferOrErr.getError()); 91 92 if (close(FD) != 0) 93 return errorCodeToError(std::error_code(errno, std::generic_category())); 94 95 NewArchiveMember M; 96 M.Buf = std::move(*MemberBufferOrErr); 97 if (!Deterministic) { 98 M.ModTime = std::chrono::time_point_cast<std::chrono::seconds>( 99 Status.getLastModificationTime()); 100 M.UID = Status.getUser(); 101 M.GID = Status.getGroup(); 102 M.Perms = Status.permissions(); 103 } 104 return std::move(M); 105 } 106 107 template <typename T> 108 static void printWithSpacePadding(raw_fd_ostream &OS, T Data, unsigned Size, 109 bool MayTruncate = false) { 110 uint64_t OldPos = OS.tell(); 111 OS << Data; 112 unsigned SizeSoFar = OS.tell() - OldPos; 113 if (Size > SizeSoFar) { 114 OS.indent(Size - SizeSoFar); 115 } else if (Size < SizeSoFar) { 116 assert(MayTruncate && "Data doesn't fit in Size"); 117 // Some of the data this is used for (like UID) can be larger than the 118 // space available in the archive format. Truncate in that case. 119 OS.seek(OldPos + Size); 120 } 121 } 122 123 static void print32(raw_ostream &Out, object::Archive::Kind Kind, 124 uint32_t Val) { 125 if (Kind == object::Archive::K_GNU) 126 support::endian::Writer<support::big>(Out).write(Val); 127 else 128 support::endian::Writer<support::little>(Out).write(Val); 129 } 130 131 static void printRestOfMemberHeader( 132 raw_fd_ostream &Out, const sys::TimePoint<std::chrono::seconds> &ModTime, 133 unsigned UID, unsigned GID, unsigned Perms, unsigned Size) { 134 printWithSpacePadding(Out, sys::toTimeT(ModTime), 12); 135 printWithSpacePadding(Out, UID, 6, true); 136 printWithSpacePadding(Out, GID, 6, true); 137 printWithSpacePadding(Out, format("%o", Perms), 8); 138 printWithSpacePadding(Out, Size, 10); 139 Out << "`\n"; 140 } 141 142 static void 143 printGNUSmallMemberHeader(raw_fd_ostream &Out, StringRef Name, 144 const sys::TimePoint<std::chrono::seconds> &ModTime, 145 unsigned UID, unsigned GID, unsigned Perms, 146 unsigned Size) { 147 printWithSpacePadding(Out, Twine(Name) + "/", 16); 148 printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, Size); 149 } 150 151 static void 152 printBSDMemberHeader(raw_fd_ostream &Out, StringRef Name, 153 const sys::TimePoint<std::chrono::seconds> &ModTime, 154 unsigned UID, unsigned GID, unsigned Perms, 155 unsigned Size) { 156 uint64_t PosAfterHeader = Out.tell() + 60 + Name.size(); 157 // Pad so that even 64 bit object files are aligned. 158 unsigned Pad = OffsetToAlignment(PosAfterHeader, 8); 159 unsigned NameWithPadding = Name.size() + Pad; 160 printWithSpacePadding(Out, Twine("#1/") + Twine(NameWithPadding), 16); 161 printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, 162 NameWithPadding + Size); 163 Out << Name; 164 assert(PosAfterHeader == Out.tell()); 165 while (Pad--) 166 Out.write(uint8_t(0)); 167 } 168 169 static bool useStringTable(bool Thin, StringRef Name) { 170 return Thin || Name.size() >= 16; 171 } 172 173 static void 174 printMemberHeader(raw_fd_ostream &Out, object::Archive::Kind Kind, bool Thin, 175 StringRef Name, 176 std::vector<unsigned>::iterator &StringMapIndexIter, 177 const sys::TimePoint<std::chrono::seconds> &ModTime, 178 unsigned UID, unsigned GID, unsigned Perms, unsigned Size) { 179 if (Kind == object::Archive::K_BSD) 180 return printBSDMemberHeader(Out, Name, ModTime, UID, GID, Perms, Size); 181 if (!useStringTable(Thin, Name)) 182 return printGNUSmallMemberHeader(Out, Name, ModTime, UID, GID, Perms, Size); 183 Out << '/'; 184 printWithSpacePadding(Out, *StringMapIndexIter++, 15); 185 printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, Size); 186 } 187 188 // Compute the relative path from From to To. 189 static std::string computeRelativePath(StringRef From, StringRef To) { 190 if (sys::path::is_absolute(From) || sys::path::is_absolute(To)) 191 return To; 192 193 StringRef DirFrom = sys::path::parent_path(From); 194 auto FromI = sys::path::begin(DirFrom); 195 auto ToI = sys::path::begin(To); 196 while (*FromI == *ToI) { 197 ++FromI; 198 ++ToI; 199 } 200 201 SmallString<128> Relative; 202 for (auto FromE = sys::path::end(DirFrom); FromI != FromE; ++FromI) 203 sys::path::append(Relative, ".."); 204 205 for (auto ToE = sys::path::end(To); ToI != ToE; ++ToI) 206 sys::path::append(Relative, *ToI); 207 208 #ifdef LLVM_ON_WIN32 209 // Replace backslashes with slashes so that the path is portable between *nix 210 // and Windows. 211 std::replace(Relative.begin(), Relative.end(), '\\', '/'); 212 #endif 213 214 return Relative.str(); 215 } 216 217 static void writeStringTable(raw_fd_ostream &Out, StringRef ArcName, 218 ArrayRef<NewArchiveMember> Members, 219 std::vector<unsigned> &StringMapIndexes, 220 bool Thin) { 221 unsigned StartOffset = 0; 222 for (const NewArchiveMember &M : Members) { 223 StringRef Path = M.Buf->getBufferIdentifier(); 224 StringRef Name = sys::path::filename(Path); 225 if (!useStringTable(Thin, Name)) 226 continue; 227 if (StartOffset == 0) { 228 printWithSpacePadding(Out, "//", 58); 229 Out << "`\n"; 230 StartOffset = Out.tell(); 231 } 232 StringMapIndexes.push_back(Out.tell() - StartOffset); 233 234 if (Thin) 235 Out << computeRelativePath(ArcName, Path); 236 else 237 Out << Name; 238 239 Out << "/\n"; 240 } 241 if (StartOffset == 0) 242 return; 243 if (Out.tell() % 2) 244 Out << '\n'; 245 int Pos = Out.tell(); 246 Out.seek(StartOffset - 12); 247 printWithSpacePadding(Out, Pos - StartOffset, 10); 248 Out.seek(Pos); 249 } 250 251 static sys::TimePoint<std::chrono::seconds> now(bool Deterministic) { 252 using namespace std::chrono; 253 254 if (!Deterministic) 255 return time_point_cast<seconds>(system_clock::now()); 256 return sys::TimePoint<seconds>(); 257 } 258 259 // Returns the offset of the first reference to a member offset. 260 static ErrorOr<unsigned> 261 writeSymbolTable(raw_fd_ostream &Out, object::Archive::Kind Kind, 262 ArrayRef<NewArchiveMember> Members, 263 std::vector<unsigned> &MemberOffsetRefs, bool Deterministic) { 264 unsigned HeaderStartOffset = 0; 265 unsigned BodyStartOffset = 0; 266 SmallString<128> NameBuf; 267 raw_svector_ostream NameOS(NameBuf); 268 LLVMContext Context; 269 for (unsigned MemberNum = 0, N = Members.size(); MemberNum < N; ++MemberNum) { 270 MemoryBufferRef MemberBuffer = Members[MemberNum].Buf->getMemBufferRef(); 271 Expected<std::unique_ptr<object::SymbolicFile>> ObjOrErr = 272 object::SymbolicFile::createSymbolicFile( 273 MemberBuffer, sys::fs::file_magic::unknown, &Context); 274 if (!ObjOrErr) { 275 // FIXME: check only for "not an object file" errors. 276 consumeError(ObjOrErr.takeError()); 277 continue; 278 } 279 object::SymbolicFile &Obj = *ObjOrErr.get(); 280 281 if (!HeaderStartOffset) { 282 HeaderStartOffset = Out.tell(); 283 if (Kind == object::Archive::K_GNU) 284 printGNUSmallMemberHeader(Out, "", now(Deterministic), 0, 0, 0, 0); 285 else 286 printBSDMemberHeader(Out, "__.SYMDEF", now(Deterministic), 0, 0, 0, 0); 287 BodyStartOffset = Out.tell(); 288 print32(Out, Kind, 0); // number of entries or bytes 289 } 290 291 for (const object::BasicSymbolRef &S : Obj.symbols()) { 292 uint32_t Symflags = S.getFlags(); 293 if (Symflags & object::SymbolRef::SF_FormatSpecific) 294 continue; 295 if (!(Symflags & object::SymbolRef::SF_Global)) 296 continue; 297 if (Symflags & object::SymbolRef::SF_Undefined) 298 continue; 299 300 unsigned NameOffset = NameOS.tell(); 301 if (auto EC = S.printName(NameOS)) 302 return EC; 303 NameOS << '\0'; 304 MemberOffsetRefs.push_back(MemberNum); 305 if (Kind == object::Archive::K_BSD) 306 print32(Out, Kind, NameOffset); 307 print32(Out, Kind, 0); // member offset 308 } 309 } 310 311 if (HeaderStartOffset == 0) 312 return 0; 313 314 StringRef StringTable = NameOS.str(); 315 if (Kind == object::Archive::K_BSD) 316 print32(Out, Kind, StringTable.size()); // byte count of the string table 317 Out << StringTable; 318 319 // ld64 requires the next member header to start at an offset that is 320 // 4 bytes aligned. 321 unsigned Pad = OffsetToAlignment(Out.tell(), 4); 322 while (Pad--) 323 Out.write(uint8_t(0)); 324 325 // Patch up the size of the symbol table now that we know how big it is. 326 unsigned Pos = Out.tell(); 327 const unsigned MemberHeaderSize = 60; 328 Out.seek(HeaderStartOffset + 48); // offset of the size field. 329 printWithSpacePadding(Out, Pos - MemberHeaderSize - HeaderStartOffset, 10); 330 331 // Patch up the number of symbols. 332 Out.seek(BodyStartOffset); 333 unsigned NumSyms = MemberOffsetRefs.size(); 334 if (Kind == object::Archive::K_GNU) 335 print32(Out, Kind, NumSyms); 336 else 337 print32(Out, Kind, NumSyms * 8); 338 339 Out.seek(Pos); 340 return BodyStartOffset + 4; 341 } 342 343 std::pair<StringRef, std::error_code> 344 llvm::writeArchive(StringRef ArcName, 345 std::vector<NewArchiveMember> &NewMembers, 346 bool WriteSymtab, object::Archive::Kind Kind, 347 bool Deterministic, bool Thin, 348 std::unique_ptr<MemoryBuffer> OldArchiveBuf) { 349 assert((!Thin || Kind == object::Archive::K_GNU) && 350 "Only the gnu format has a thin mode"); 351 SmallString<128> TmpArchive; 352 int TmpArchiveFD; 353 if (auto EC = sys::fs::createUniqueFile(ArcName + ".temp-archive-%%%%%%%.a", 354 TmpArchiveFD, TmpArchive)) 355 return std::make_pair(ArcName, EC); 356 357 tool_output_file Output(TmpArchive, TmpArchiveFD); 358 raw_fd_ostream &Out = Output.os(); 359 if (Thin) 360 Out << "!<thin>\n"; 361 else 362 Out << "!<arch>\n"; 363 364 std::vector<unsigned> MemberOffsetRefs; 365 366 std::vector<std::unique_ptr<MemoryBuffer>> Buffers; 367 std::vector<MemoryBufferRef> Members; 368 std::vector<sys::fs::file_status> NewMemberStatus; 369 370 unsigned MemberReferenceOffset = 0; 371 if (WriteSymtab) { 372 ErrorOr<unsigned> MemberReferenceOffsetOrErr = writeSymbolTable( 373 Out, Kind, NewMembers, MemberOffsetRefs, Deterministic); 374 if (auto EC = MemberReferenceOffsetOrErr.getError()) 375 return std::make_pair(ArcName, EC); 376 MemberReferenceOffset = MemberReferenceOffsetOrErr.get(); 377 } 378 379 std::vector<unsigned> StringMapIndexes; 380 if (Kind != object::Archive::K_BSD) 381 writeStringTable(Out, ArcName, NewMembers, StringMapIndexes, Thin); 382 383 std::vector<unsigned>::iterator StringMapIndexIter = StringMapIndexes.begin(); 384 std::vector<unsigned> MemberOffset; 385 for (const NewArchiveMember &M : NewMembers) { 386 MemoryBufferRef File = M.Buf->getMemBufferRef(); 387 388 unsigned Pos = Out.tell(); 389 MemberOffset.push_back(Pos); 390 391 printMemberHeader(Out, Kind, Thin, 392 sys::path::filename(M.Buf->getBufferIdentifier()), 393 StringMapIndexIter, M.ModTime, M.UID, M.GID, M.Perms, 394 M.Buf->getBufferSize()); 395 396 if (!Thin) 397 Out << File.getBuffer(); 398 399 if (Out.tell() % 2) 400 Out << '\n'; 401 } 402 403 if (MemberReferenceOffset) { 404 Out.seek(MemberReferenceOffset); 405 for (unsigned MemberNum : MemberOffsetRefs) { 406 if (Kind == object::Archive::K_BSD) 407 Out.seek(Out.tell() + 4); // skip over the string offset 408 print32(Out, Kind, MemberOffset[MemberNum]); 409 } 410 } 411 412 Output.keep(); 413 Out.close(); 414 415 // At this point, we no longer need whatever backing memory 416 // was used to generate the NewMembers. On Windows, this buffer 417 // could be a mapped view of the file we want to replace (if 418 // we're updating an existing archive, say). In that case, the 419 // rename would still succeed, but it would leave behind a 420 // temporary file (actually the original file renamed) because 421 // a file cannot be deleted while there's a handle open on it, 422 // only renamed. So by freeing this buffer, this ensures that 423 // the last open handle on the destination file, if any, is 424 // closed before we attempt to rename. 425 OldArchiveBuf.reset(); 426 427 sys::fs::rename(TmpArchive, ArcName); 428 return std::make_pair("", std::error_code()); 429 } 430